QOJ.ac

QOJ

IDProblemSubmitterResultTimeMemoryLanguageFile sizeSubmit timeJudge time
#657703#9486. Random Mexucup-team159#AC ✓1132ms629936kbC++2353.6kb2024-10-19 15:16:432024-10-19 15:16:44

Judging History

你现在查看的是最新测评结果

  • [2024-10-19 15:16:44]
  • 评测
  • 测评结果:AC
  • 用时:1132ms
  • 内存:629936kb
  • [2024-10-19 15:16:43]
  • 提交

answer

#line 2 "/home/vscode/fastfps/src/fastfps/modint.hpp"

#include <vector>
#pragma GCC target("avx2,bmi,bmi2,lzcnt,popcnt")

#include <array>
#include <cassert>
#include <iostream>

#line 1 "/home/vscode/fastfps/src/fastfps/types.hpp"
#include <cstdint>

namespace fastfps {

using i32 = int32_t;
using u32 = uint32_t;
using i64 = int64_t;
using u64 = uint64_t;

}  // namespace fastfps
#line 8 "/home/vscode/fastfps/src/fastfps/modint.hpp"

namespace fastfps {

// x * inv_u32(x) = 1 (mod 2^32)
constexpr u32 inv_u32(const u32 x) {
    assert(x % 2);
    u32 inv = 1;
    for (int i = 0; i < 5; i++) {
        inv *= 2u - inv * x;
    }
    return inv;
}

template <u32 MOD> struct ModInt {
    static_assert(MOD % 2 && MOD <= (1U << 30) - 1,
                  "mod must be odd and at most 2^30 - 1");

    static constexpr u32 mod() { return MOD; }

    constexpr ModInt() : x(0) {}
    constexpr explicit ModInt(u32 _x) : x(mulreduce(_x, B2)) {}

    constexpr ModInt(std::signed_integral auto _x)
        : ModInt((u32)(_x % (i32)MOD + MOD)) {}
    constexpr ModInt(std::unsigned_integral auto _x)
        : ModInt((u32)(_x % MOD)) {}

    constexpr u32 val() const {
        u32 y = mulreduce(x, 1);
        return y < MOD ? y : y - MOD;
    }
    constexpr u32 internal_val() const { return x; }

    constexpr ModInt& operator+=(const ModInt& rhs) {
        x += rhs.x;
        x = std::min(x, x - 2 * MOD);
        return *this;
    }
    constexpr friend ModInt operator+(const ModInt& lhs, const ModInt& rhs) {
        return ModInt(lhs) += rhs;
    }

    constexpr ModInt& operator-=(const ModInt& rhs) {
        x += 2 * MOD - rhs.x;
        x = std::min(x, x - 2 * MOD);
        return *this;
    }
    constexpr friend ModInt operator-(const ModInt& lhs, const ModInt& rhs) {
        return ModInt(lhs) -= rhs;
    }

    constexpr ModInt& operator*=(const ModInt& rhs) {
        x = mulreduce(x, rhs.x);
        return *this;
    }
    constexpr friend ModInt operator*(const ModInt& lhs, const ModInt& rhs) {
        return ModInt(lhs) *= rhs;
    }

    friend bool operator==(const ModInt& lhs, const ModInt& rhs) {
        auto lx = lhs.x;
        if (lx >= MOD) lx -= MOD;
        auto rx = rhs.x;
        if (rx >= MOD) rx -= MOD;
        return lx == rx;
    }

    constexpr ModInt pow(u64 n) const {
        ModInt v = *this, r = 1;
        while (n) {
            if (n & 1) r *= v;
            v *= v;
            n >>= 1;
        }
        return r;
    }
    constexpr ModInt inv() const {
        // TODO: for non-prime
        return pow(MOD - 2);
    }

    friend std::ostream& operator<<(std::ostream& os, const ModInt& v) {
        return os << v.val();
    }

  private:
    u32 x;

    static constexpr u32 B = ((u64(1) << 32)) % MOD;
    static constexpr u32 B2 = u64(1) * B * B % MOD;
    static constexpr u32 INV = -inv_u32(MOD);

    // Input: (l * r) must be no more than (2^32 * MOD)
    // Output: ((l * r) / 2^32) % MOD
    static constexpr u32 mulreduce(u32 l, u32 r) {
        u64 x = u64(1) * l * r;
        x += u64(u32(x) * INV) * MOD;
        return u32(x >> 32);
    }
};

template <typename T> struct is_modint : std::false_type {};
template <u32 MOD> struct is_modint<ModInt<MOD>> : std::true_type {};

}  // namespace fastfps
#line 2 "ucup3-13/K/main.cpp"
#define YOSUPO_AVX2_PRAGMA
// #undef YOSUPO_LOCAL

#line 2 "/home/vscode/yosupo-library/src/yosupo/fastio.hpp"

#include <unistd.h>
#include <algorithm>
#line 6 "/home/vscode/yosupo-library/src/yosupo/fastio.hpp"
#include <bit>
#line 8 "/home/vscode/yosupo-library/src/yosupo/fastio.hpp"
#include <cctype>
#line 10 "/home/vscode/yosupo-library/src/yosupo/fastio.hpp"
#include <cstring>
#include <sstream>
#include <string>
#include <type_traits>
#include <vector>

#line 2 "/home/vscode/yosupo-library/src/yosupo/internal_type_traits.hpp"

#line 5 "/home/vscode/yosupo-library/src/yosupo/internal_type_traits.hpp"

namespace yosupo {

namespace internal {

template <class T>
using is_signed_int128 =
    typename std::conditional<std::is_same<T, __int128_t>::value ||
                                  std::is_same<T, __int128>::value,
                              std::true_type,
                              std::false_type>::type;

template <class T>
using is_unsigned_int128 =
    typename std::conditional<std::is_same<T, __uint128_t>::value ||
                                  std::is_same<T, unsigned __int128>::value,
                              std::true_type,
                              std::false_type>::type;

template <class T>
using make_unsigned_int128 =
    typename std::conditional<std::is_same<T, __int128_t>::value,
                              __uint128_t,
                              unsigned __int128>;

template <class T>
using is_integral =
    typename std::conditional<std::is_integral<T>::value ||
                                  internal::is_signed_int128<T>::value ||
                                  internal::is_unsigned_int128<T>::value,
                              std::true_type,
                              std::false_type>::type;

template <class T>
using is_signed_int = typename std::conditional<(is_integral<T>::value &&
                                                 std::is_signed<T>::value) ||
                                                    is_signed_int128<T>::value,
                                                std::true_type,
                                                std::false_type>::type;

template <class T>
using is_unsigned_int =
    typename std::conditional<(is_integral<T>::value &&
                               std::is_unsigned<T>::value) ||
                                  is_unsigned_int128<T>::value,
                              std::true_type,
                              std::false_type>::type;

template <class T>
using to_unsigned = typename std::conditional<
    is_signed_int128<T>::value,
    make_unsigned_int128<T>,
    typename std::conditional<std::is_signed<T>::value,
                              std::make_unsigned<T>,
                              std::common_type<T>>::type>::type;

template <class T>
using is_integral_t = std::enable_if_t<is_integral<T>::value>;

template <class T>
using is_signed_int_t = std::enable_if_t<is_signed_int<T>::value>;

template <class T>
using is_unsigned_int_t = std::enable_if_t<is_unsigned_int<T>::value>;

template <class T> using to_unsigned_t = typename to_unsigned<T>::type;

}  // namespace internal

}  // namespace yosupo
#line 17 "/home/vscode/yosupo-library/src/yosupo/fastio.hpp"

namespace yosupo {

struct Scanner {
  public:
    Scanner(const Scanner&) = delete;
    Scanner& operator=(const Scanner&) = delete;

    Scanner(FILE* fp) : fd(fileno(fp)) { line[0] = 127; }

    void read() {}
    template <class H, class... T> void read(H& h, T&... t) {
        bool f = read_single(h);
        assert(f);
        read(t...);
    }

    int read_unsafe() { return 0; }
    template <class H, class... T> int read_unsafe(H& h, T&... t) {
        bool f = read_single(h);
        if (!f) return 0;
        return 1 + read_unsafe(t...);
    }

    int close() { return ::close(fd); }

  private:
    static constexpr int SIZE = 1 << 15;

    int fd = -1;
    std::array<char, SIZE + 1> line;
    int st = 0, ed = 0;
    bool eof = false;

    bool read_single(std::string& ref) {
        if (!skip_space()) return false;
        ref = "";
        while (true) {
            char c = top();
            if (c <= ' ') break;
            ref += c;
            st++;
        }
        return true;
    }
    bool read_single(double& ref) {
        std::string s;
        if (!read_single(s)) return false;
        ref = std::stod(s);
        return true;
    }

    template <class T,
              std::enable_if_t<std::is_same<T, char>::value>* = nullptr>
    bool read_single(T& ref) {
        if (!skip_space<50>()) return false;
        ref = top();
        st++;
        return true;
    }

    template <class T,
              internal::is_signed_int_t<T>* = nullptr,
              std::enable_if_t<!std::is_same<T, char>::value>* = nullptr>
    bool read_single(T& sref) {
        using U = internal::to_unsigned_t<T>;
        if (!skip_space<50>()) return false;
        bool neg = false;
        if (line[st] == '-') {
            neg = true;
            st++;
        }
        U ref = 0;
        do {
            ref = 10 * ref + (line[st++] & 0x0f);
        } while (line[st] >= '0');
        sref = neg ? -ref : ref;
        return true;
    }
    template <class U,
              internal::is_unsigned_int_t<U>* = nullptr,
              std::enable_if_t<!std::is_same<U, char>::value>* = nullptr>
    bool read_single(U& ref) {
        if (!skip_space<50>()) return false;
        ref = 0;
        do {
            ref = 10 * ref + (line[st++] & 0x0f);
        } while (line[st] >= '0');
        return true;
    }

    bool reread() {
        if (ed - st >= 50) return true;
        if (st > SIZE / 2) {
            std::memmove(line.data(), line.data() + st, ed - st);
            ed -= st;
            st = 0;
        }
        if (eof) return false;
        auto u = ::read(fd, line.data() + ed, SIZE - ed);
        if (u == 0) {
            eof = true;
            line[ed] = '\0';
            u = 1;
        }
        ed += int(u);
        line[ed] = char(127);
        return true;
    }

    char top() {
        if (st == ed) {
            bool f = reread();
            assert(f);
        }
        return line[st];
    }

    template <int TOKEN_LEN = 0> bool skip_space() {
        while (true) {
            while (line[st] <= ' ') st++;
            if (ed - st > TOKEN_LEN) return true;
            if (st > ed) st = ed;
            for (auto i = st; i < ed; i++) {
                if (line[i] <= ' ') return true;
            }
            if (!reread()) return false;
        }
    }
};

struct Printer {
  public:
    template <char sep = ' ', bool F = false> void write() {}
    template <char sep = ' ', bool F = false, class H, class... T>
    void write(const H& h, const T&... t) {
        if (F) write_single(sep);
        write_single(h);
        write<true>(t...);
    }
    template <char sep = ' ', class... T> void writeln(const T&... t) {
        write<sep>(t...);
        write_single('\n');
    }

    Printer(FILE* _fp) : fd(fileno(_fp)) {}
    ~Printer() { flush(); }

    int close() {
        flush();
        return ::close(fd);
    }

    void flush() {
        if (pos) {
            auto res = ::write(fd, line.data(), pos);
            assert(res != -1);
            pos = 0;
        }
    }

  private:
    static std::array<std::array<char, 2>, 100> small;
    static std::array<unsigned long long, 20> tens;

    static constexpr size_t SIZE = 1 << 15;
    int fd;
    std::array<char, SIZE> line;
    size_t pos = 0;
    std::stringstream ss;

    template <class T,
              std::enable_if_t<std::is_same<char, T>::value>* = nullptr>
    void write_single(const T& val) {
        if (pos == SIZE) flush();
        line[pos++] = val;
    }

    template <class T,
              internal::is_signed_int_t<T>* = nullptr,
              std::enable_if_t<!std::is_same<char, T>::value>* = nullptr>
    void write_single(const T& val) {
        using U = internal::to_unsigned_t<T>;
        if (val == 0) {
            write_single('0');
            return;
        }
        if (pos > SIZE - 50) flush();
        U uval = val;
        if (val < 0) {
            write_single('-');
            uval = -uval;
        }
        write_unsigned(uval);
    }

    template <class U,
              internal::is_unsigned_int_t<U>* = nullptr,
              std::enable_if_t<!std::is_same<char, U>::value>* = nullptr>
    void write_single(U uval) {
        if (uval == 0) {
            write_single('0');
            return;
        }
        if (pos > SIZE - 50) flush();

        write_unsigned(uval);
    }

    static int calc_len(uint64_t x) {
        int i = ((63 - std::countl_zero(x)) * 3 + 3) / 10;
        if (x < tens[i])
            return i;
        else
            return i + 1;
    }

    template <class U,
              internal::is_unsigned_int_t<U>* = nullptr,
              std::enable_if_t<2 >= sizeof(U)>* = nullptr>
    void write_unsigned(U uval) {
        size_t len = calc_len(uval);
        pos += len;

        char* ptr = line.data() + pos;
        while (uval >= 100) {
            ptr -= 2;
            memcpy(ptr, small[uval % 100].data(), 2);
            uval /= 100;
        }
        if (uval >= 10) {
            memcpy(ptr - 2, small[uval].data(), 2);
        } else {
            *(ptr - 1) = char('0' + uval);
        }
    }

    template <class U,
              internal::is_unsigned_int_t<U>* = nullptr,
              std::enable_if_t<4 == sizeof(U)>* = nullptr>
    void write_unsigned(U uval) {
        std::array<char, 8> buf;
        memcpy(buf.data() + 6, small[uval % 100].data(), 2);
        memcpy(buf.data() + 4, small[uval / 100 % 100].data(), 2);
        memcpy(buf.data() + 2, small[uval / 10000 % 100].data(), 2);
        memcpy(buf.data() + 0, small[uval / 1000000 % 100].data(), 2);

        if (uval >= 100000000) {
            if (uval >= 1000000000) {
                memcpy(line.data() + pos, small[uval / 100000000 % 100].data(),
                       2);
                pos += 2;
            } else {
                line[pos] = char('0' + uval / 100000000);
                pos++;
            }
            memcpy(line.data() + pos, buf.data(), 8);
            pos += 8;
        } else {
            size_t len = calc_len(uval);
            memcpy(line.data() + pos, buf.data() + (8 - len), len);
            pos += len;
        }
    }

    template <class U,
              internal::is_unsigned_int_t<U>* = nullptr,
              std::enable_if_t<8 == sizeof(U)>* = nullptr>
    void write_unsigned(U uval) {
        size_t len = calc_len(uval);
        pos += len;

        char* ptr = line.data() + pos;
        while (uval >= 100) {
            ptr -= 2;
            memcpy(ptr, small[uval % 100].data(), 2);
            uval /= 100;
        }
        if (uval >= 10) {
            memcpy(ptr - 2, small[uval].data(), 2);
        } else {
            *(ptr - 1) = char('0' + uval);
        }
    }

    template <
        class U,
        std::enable_if_t<internal::is_unsigned_int128<U>::value>* = nullptr>
    void write_unsigned(U uval) {
        static std::array<char, 50> buf;
        size_t len = 0;
        while (uval > 0) {
            buf[len++] = char((uval % 10) + '0');
            uval /= 10;
        }
        std::reverse(buf.begin(), buf.begin() + len);
        memcpy(line.data() + pos, buf.data(), len);
        pos += len;
    }

    void write_single(const std::string& s) {
        for (char c : s) write_single(c);
    }
    void write_single(const char* s) {
        size_t len = strlen(s);
        for (size_t i = 0; i < len; i++) write_single(s[i]);
    }
    template <class T> void write_single(const std::vector<T>& val) {
        auto n = val.size();
        for (size_t i = 0; i < n; i++) {
            if (i) write_single(' ');
            write_single(val[i]);
        }
    }
};

inline std::array<std::array<char, 2>, 100> Printer::small = [] {
    std::array<std::array<char, 2>, 100> table;
    for (int i = 0; i <= 99; i++) {
        table[i][1] = char('0' + (i % 10));
        table[i][0] = char('0' + (i / 10 % 10));
    }
    return table;
}();
inline std::array<unsigned long long, 20> Printer::tens = [] {
    std::array<unsigned long long, 20> table;
    for (int i = 0; i < 20; i++) {
        table[i] = 1;
        for (int j = 0; j < i; j++) {
            table[i] *= 10;
        }
    }
    return table;
}();

}  // namespace yosupo
#line 2 "/home/vscode/yosupo-library/src/yosupo/random.hpp"

#line 6 "/home/vscode/yosupo-library/src/yosupo/random.hpp"
#include <chrono>
#line 8 "/home/vscode/yosupo-library/src/yosupo/random.hpp"
#include <random>
#line 10 "/home/vscode/yosupo-library/src/yosupo/random.hpp"

namespace yosupo {

struct Xoshiro256StarStar {
  public:
    using result_type = uint64_t;
    Xoshiro256StarStar() : Xoshiro256StarStar(0) {}
    explicit Xoshiro256StarStar(uint64_t seed) {
        // use splitmix64
        // Reference: http://xoshiro.di.unimi.it/splitmix64.c
        for (int i = 0; i < 4; i++) {
            uint64_t z = (seed += 0x9e3779b97f4a7c15);
            z = (z ^ (z >> 30)) * 0xbf58476d1ce4e5b9;
            z = (z ^ (z >> 27)) * 0x94d049bb133111eb;
            s[i] = z ^ (z >> 31);
        }
    }

    static constexpr result_type min() { return 0; }
    static constexpr result_type max() { return -1; }

    result_type operator()() {
        const uint64_t result_starstar = rotl(s[1] * 5, 7) * 9;

        const uint64_t t = s[1] << 17;

        s[2] ^= s[0];
        s[3] ^= s[1];
        s[1] ^= s[2];
        s[0] ^= s[3];

        s[2] ^= t;

        s[3] = rotl(s[3], 45);

        return result_starstar;
    }

  private:
    // Use xoshiro256**
    // Refereces: http://xoshiro.di.unimi.it/xoshiro256starstar.c
    static uint64_t rotl(const uint64_t x, int k) {
        return (x << k) | (x >> (64 - k));
    }

    std::array<uint64_t, 4> s;
};

// https://github.com/wangyi-fudan/wyhash
struct WYRand {
  public:
    using result_type = uint64_t;
    explicit WYRand(uint64_t seed) : s(seed) {}

    static constexpr result_type min() { return 0; }
    static constexpr result_type max() { return -1; }

    result_type operator()() {
        s += 0x2d358dccaa6c78a5;
        auto x = (unsigned __int128)s * (s ^ 0x8bb84b93962eacc9);
        return (uint64_t)(x ^ (x >> 64));
    }

  private:
    uint64_t s;
};
using Random = WYRand;
inline Random& global_gen() {
    static Random gen(
        std::chrono::steady_clock::now().time_since_epoch().count());
    return gen;
}

template <class G>
concept random_64 = std::uniform_random_bit_generator<G> &&
                    std::same_as<uint64_t, std::invoke_result_t<G&>> &&
                    G::min() == uint64_t(0) && G::max() == uint64_t(-1);

namespace internal {

// random choice from [0, upper]
template <random_64 G> uint64_t uniform_u64(uint64_t upper, G& gen) {
    if (!(upper & (upper + 1))) {
        // b = 00..0011..11
        return gen() & upper;
    }
    int log = 63 - std::countl_zero(upper);
    uint64_t mask = (log == 63) ? ~0ULL : (1ULL << (log + 1)) - 1;
    while (true) {
        uint64_t r = gen() & mask;
        if (r <= upper) return r;
    }
}

// random choice from [0, upper], faster than uniform_u64
template <random_64 G> uint64_t random_u64(uint64_t upper, G& gen) {
    return (uint64_t)(((unsigned __int128)(upper) + 1) * gen() >> 64);
}

}  // namespace internal

template <class T, random_64 G> T uniform(T lower, T upper, G& gen) {
    return T(lower +
             internal::uniform_u64(uint64_t(upper) - uint64_t(lower), gen));
}
template <class T> T uniform(T lower, T upper) {
    return uniform(lower, upper, global_gen());
}
template <class T, random_64 G> T random(T lower, T upper, G& gen) {
    return T(lower +
             internal::random_u64(uint64_t(upper) - uint64_t(lower), gen));
}
template <class T> T random(T lower, T upper) {
    return random(lower, upper, global_gen());
}

template <random_64 G> bool uniform_bool(G& gen) { return gen() & 1; }
inline bool uniform_bool() { return uniform_bool(global_gen()); }

// select 2 elements from [lower, uppper]
template <class T, random_64 G>
std::pair<T, T> uniform_pair(T lower, T upper, G& gen) {
    assert(upper - lower >= 1);
    T a, b;
    do {
        a = uniform(lower, upper, gen);
        b = uniform(lower, upper, gen);
    } while (a == b);
    if (a > b) std::swap(a, b);
    return {a, b};
}
template <class T> std::pair<T, T> uniform_pair(T lower, T upper) {
    return uniform_pair(lower, upper, global_gen());
}

// random value in the interval (0.0, 1.0]
template <class G> inline double open_closed_01(G& gen) {
    union {
        uint64_t i;
        double f;
    } u = {0xbff0000000000000 | (gen() >> 12)};
    return 2.0 + u.f;
}
inline double open_closed_01() {
    return open_closed_01(global_gen());
}

}  // namespace yosupo
#line 2 "/home/vscode/fastfps/src/fastfps/modvec.hpp"

#line 6 "/home/vscode/fastfps/src/fastfps/modvec.hpp"

#line 2 "/home/vscode/fastfps/src/fastfps/fft.hpp"

#line 5 "/home/vscode/fastfps/src/fastfps/fft.hpp"
#include <concepts>
#include <ranges>
#line 8 "/home/vscode/fastfps/src/fastfps/fft.hpp"

#line 2 "/home/vscode/fastfps/src/fastfps/math.hpp"

#line 2 "/home/vscode/fastfps/src/fastfps/types.hpp"

namespace fastfps {

using i32 = int32_t;
using u32 = uint32_t;
using i64 = int64_t;
using u64 = uint64_t;

}  // namespace fastfps
#line 4 "/home/vscode/fastfps/src/fastfps/math.hpp"

namespace fastfps {

constexpr u32 pow_mod_constexpr(u64 x, u64 n, u32 m) {
    if (m == 1) return 0;
    x %= m;

    u64 r = 1;
    while (n) {
        if (n & 1) r = (r * x) % m;
        x = (x * x) % m;
        n >>= 1;
    }

    return (u32)(r);
}

constexpr u32 primitive_root_constexpr(u32 m) {
    if (m == 2) return 1;

    u32 divs[20] = {};
    int cnt = 0;
    u32 x = (m - 1) / 2;
    for (int i = 2; (u64)(i)*i <= x; i += 2) {
        if (x % i == 0) {
            divs[cnt++] = i;
            while (x % i == 0) {
                x /= i;
            }
        }
    }
    if (x > 1) {
        divs[cnt++] = x;
    }
    for (u32 g = 2;; g++) {
        bool ok = true;
        for (int i = 0; i < cnt; i++) {
            if (pow_mod_constexpr(g, (m - 1) / divs[i], m) == 1) {
                ok = false;
                break;
            }
        }
        if (ok) return g;
    }
}
template <u32 m> constexpr u32 primitive_root = primitive_root_constexpr(m);

}  // namespace fastfps
#line 2 "/home/vscode/fastfps/src/fastfps/modint8.hpp"

#include <immintrin.h>


#line 10 "/home/vscode/fastfps/src/fastfps/modint8.hpp"
#include <span>

#line 2 "/home/vscode/fastfps/src/fastfps/types.hpp"

namespace fastfps {

using i32 = int32_t;
using u32 = uint32_t;
using i64 = int64_t;
using u64 = uint64_t;

}  // namespace fastfps
#line 15 "/home/vscode/fastfps/src/fastfps/modint8.hpp"

namespace fastfps {

template <u32 MOD> struct ModInt8 {
    using modint = ModInt<MOD>;
    using m256i_u = __m256i_u;

    static_assert(MOD % 2 && MOD <= (1U << 30) - 1,
                  "mod must be odd and at most 2^30 - 1");

    static constexpr u32 mod() { return MOD; }

    ModInt8() : x(_mm256_setzero_si256()) {}
    ModInt8(std::span<const i32, 8> _x)
        : x(mul(_mm256_sub_epi32(_mm256_loadu_si256((m256i_u*)_x.data()),
                                 _mm256_set1_epi32(u32(1) << 31)),
                _mm256_set1_epi32(B2))) {
        static const ModInt8 OFFSET = set1(u32(1) << 31);
        *this -= OFFSET;
    }
    ModInt8(std::span<const u32, 8> _x)
        : x(mul(_mm256_loadu_si256((m256i_u*)_x.data()),
                _mm256_set1_epi32(B2))) {}
    ModInt8(std::span<const modint, 8> _x)
        : x(_mm256_loadu_si256((m256i_u*)_x.data())) {
        static_assert(sizeof(modint) == 4);
    }
    explicit ModInt8(modint x0,
                     modint x1,
                     modint x2,
                     modint x3,
                     modint x4,
                     modint x5,
                     modint x6,
                     modint x7)
        : x(_mm256_set_epi32(x7.internal_val(),
                             x6.internal_val(),
                             x5.internal_val(),
                             x4.internal_val(),
                             x3.internal_val(),
                             x2.internal_val(),
                             x1.internal_val(),
                             x0.internal_val())) {}

    static ModInt8 set1(modint x) {
        ModInt8 v;
        v.x = _mm256_set1_epi32(x.internal_val());
        return v;
    }

    std::array<u32, 8> val() const {
        const m256i_u MOD_X = _mm256_set1_epi32(MOD);

        auto a = mul(x, _mm256_set1_epi32(1));
        alignas(32) std::array<u32, 8> b;
        _mm256_storeu_si256((__m256i_u*)b.data(),
                            min(a, _mm256_sub_epi32(a, MOD_X)));
        return b;
    }

    ModInt8& operator+=(const ModInt8& rhs) {
        const m256i_u MOD2_X = _mm256_set1_epi32(2 * MOD);

        x = _mm256_add_epi32(x, rhs.x);
        x = min(x, _mm256_sub_epi32(x, MOD2_X));
        return *this;
    }
    friend ModInt8 operator+(const ModInt8& lhs, const ModInt8& rhs) {
        return ModInt8(lhs) += rhs;
    }

    ModInt8& operator-=(const ModInt8& rhs) {
        const m256i_u MOD2_X = _mm256_set1_epi32(2 * MOD);

        x = _mm256_sub_epi32(x, rhs.x);
        x = min(x, _mm256_add_epi32(x, MOD2_X));
        return *this;
    }
    friend ModInt8 operator-(const ModInt8& lhs, const ModInt8& rhs) {
        return ModInt8(lhs) -= rhs;
    }

    ModInt8& operator*=(const ModInt8& rhs) {
        x = mul(x, rhs.x);
        return *this;
    }
    friend ModInt8 operator*(const ModInt8& lhs, const ModInt8& rhs) {
        return ModInt8(lhs) *= rhs;
    }

    ModInt8 operator-() const { return ModInt8() - *this; }

    friend bool operator==(const ModInt8& lhs, const ModInt8& rhs) {
        const m256i_u MOD_X = _mm256_set1_epi32(MOD);

        auto lx = lhs.x, rx = rhs.x;
        lx = min(lx, _mm256_sub_epi32(lx, MOD_X));
        rx = min(rx, _mm256_sub_epi32(rx, MOD_X));
        auto z = _mm256_xor_si256(lx, rx);
        return _mm256_testz_si256(z, z);
    }

    // a.permutevar(idx)[i] = a[idx[i] % 8]
    ModInt8 permutevar(const std::array<u32, 8>& idx) const {
        return permutevar(_mm256_loadu_si256((m256i_u*)idx.data()));
    }

    // a[i] <- a[(middle + i) % 8]
    ModInt8 rotate(u32 middle) const {
        static const m256i_u base = _mm256_set_epi32(7, 6, 5, 4, 3, 2, 1, 0);
        return permutevar(_mm256_add_epi32(base, _mm256_set1_epi32(middle)));
    }

    template <uint8_t MASK>
    friend ModInt8 blend(const ModInt8& lhs, const ModInt8& rhs) {
        ModInt8 v;
        v.x = _mm256_blend_epi32(lhs.x, rhs.x, MASK);
        return v;
    }

    friend ModInt8 blendvar(const ModInt8& lhs,
                            const ModInt8& rhs,
                            const std::array<u32, 8>& idx) {
        ModInt8 v;
        v.x = _mm256_blendv_epi8(
            rhs.x, lhs.x,
            _mm256_cmpeq_epi32(_mm256_loadu_si256((m256i_u*)idx.data()),
                               _mm256_setzero_si256()));
        return v;
    }

  private:
    m256i_u x;

    //inline static const m256i_u MOD_X = _mm256_set1_epi32(MOD);
    //inline static const m256i_u MOD2_X = _mm256_set1_epi32(2 * MOD);
    //inline static const m256i_u N_INV_X = _mm256_set1_epi32(-inv_u32(MOD));
    //inline static const m256i_u INT_MIN_X = _mm256_set1_epi32(u32(1) << 31);

    static constexpr u32 B2 = pow_mod_constexpr(2, 64, MOD);
    inline static const m256i_u B2_X = _mm256_set1_epi32(B2);

    // Input: l * r <= 2^32 * MOD
    // Output: l * r >>= 2^32
    static m256i_u mul(const m256i_u& l, const m256i_u& r) {
        const m256i_u MOD_X = _mm256_set1_epi32(MOD);
        const m256i_u N_INV_X = _mm256_set1_epi32(-inv_u32(MOD));

        auto x0 = mul_even(l, r);
        auto x1 = mul_even(_mm256_shuffle_epi32(l, 0xf5),
                           _mm256_shuffle_epi32(r, 0xf5));
        x0 += mul_even(mul_even(x0, N_INV_X), MOD_X);
        x1 += mul_even(mul_even(x1, N_INV_X), MOD_X);

        x0 = _mm256_srli_epi64(x0, 32);
        return _mm256_blend_epi32(x0, x1, 0b10101010);
    }
    // (lr[0], lr[2], lr[4], lr[6])
    static m256i_u mul_even(const m256i_u& l, const m256i_u& r) {
        return _mm256_mul_epu32(l, r);
    }

    static m256i_u min(const m256i_u& l, const m256i_u& r) {
        return _mm256_min_epu32(l, r);
    }
    static m256i_u max(const m256i_u& l, const m256i_u& r) {
        return _mm256_max_epu32(l, r);
    }

    // a.permutevar(idx)[i] = a[idx[i] % 8]
    ModInt8 permutevar(const m256i_u& idx) const {
        ModInt8 v;
        v.x = _mm256_permutevar8x32_epi32(x, idx);
        return v;
    }
};


template <typename T> struct is_modint8 : std::false_type {};
template <u32 MOD> struct is_modint8<ModInt8<MOD>> : std::true_type {};

}  // namespace fastfps
#line 2 "/home/vscode/fastfps/src/fastfps/types.hpp"

namespace fastfps {

using i32 = int32_t;
using u32 = uint32_t;
using i64 = int64_t;
using u64 = uint64_t;

}  // namespace fastfps
#line 13 "/home/vscode/fastfps/src/fastfps/fft.hpp"

namespace fastfps {

template <u32 MOD> struct FFTInfo {
    using modint = ModInt<MOD>;
    using modint8 = ModInt8<MOD>;

    static constexpr u32 g = primitive_root<MOD>;
    static constexpr int ord2 = std::countr_zero(MOD - 1);

    // w[i]^(2^i) == 1 : w[i] is the fft omega of n=2^i
    static constexpr std::array<modint, ord2 + 1> w = []() {
        std::array<modint, ord2 + 1> v;
        v[ord2] = modint(g).pow((MOD - 1) >> ord2);
        for (int i = ord2 - 1; i >= 0; i--) {
            v[i] = v[i + 1] * v[i + 1];
        }
        return v;
    }();
    static constexpr std::array<modint, ord2 + 1> iw = []() {
        std::array<modint, ord2 + 1> v;
        v[ord2] = w[ord2].inv();
        for (int i = ord2 - 1; i >= 0; i--) {
            v[i] = v[i + 1] * v[i + 1];
        }
        return v;
    }();

    static constexpr std::array<modint, ord2 + 1> rot8 = []() {
        std::array<modint, std::max(0, ord2 + 1)> v;
        for (int i = 3; i <= ord2; i++) {
            v[i] = w[i];
            for (int j = 3; j < i; j++) {
                v[i] *= iw[j];
            }
        }
        return v;
    }();
    static constexpr std::array<modint, ord2 + 1> irot8 = []() {
        std::array<modint, std::max(0, ord2 + 1)> v;
        for (int i = 3; i <= ord2; i++) {
            v[i] = iw[i];
            for (int j = 3; j < i; j++) {
                v[i] *= w[j];
            }
        }
        return v;
    }();
    // rot[i] * rot_shift8(i) = rot[i + 8]
    modint rot_shift8(u32 i) const { return rot8[std::countr_one(i >> 3) + 3]; }
    modint irot_shift8(u32 i) const {
        return irot8[std::countr_one(i >> 3) + 3];
    }

    static constexpr std::array<modint, ord2 + 1> rot4 = []() {
        std::array<modint, std::max(0, ord2 + 1)> v;
        for (int i = 4; i <= ord2; i++) {
            v[i] = w[i];
            for (int j = 4; j < i; j++) {
                v[i] *= iw[j];
            }
        }
        return v;
    }();
    static constexpr std::array<modint, ord2 + 1> irot4 = []() {
        std::array<modint, std::max(0, ord2 + 1)> v;
        for (int i = 4; i <= ord2; i++) {
            v[i] = iw[i];
            for (int j = 4; j < i; j++) {
                v[i] *= w[j];
            }
        }
        return v;
    }();
    std::array<modint8, ord2 + 1> rot16i = []() {
        std::array<modint8, std::max(0, ord2 + 1)> v;
        for (int i = 4; i <= ord2; i++) {
            std::array<modint, 8> buf;
            buf[0] = 1;
            for (int j = 1; j < 8; j++) {
                buf[j] = buf[j - 1] * rot4[i];
            }
            v[i] = modint8(buf);
        }
        return v;
    }();
    std::array<modint8, ord2 + 1> irot16i = []() {
        std::array<modint8, std::max(0, ord2 + 1)> v;
        for (int i = 4; i <= ord2; i++) {
            std::array<modint, 8> buf;
            buf[0] = 1;
            for (int j = 1; j < 8; j++) {
                buf[j] = buf[j - 1] * irot4[i];
            }
            v[i] = modint8(buf);
        }
        return v;
    }();
    // rot[i * j] * rot_shift16i(i)[j] = rot[(i + 8) * j]
    modint8 rot_shift16i(u32 i) const {
        return rot16i[std::countr_one(i >> 4) + 4];
    }
    modint8 irot_shift16i(u32 i) const {
        return irot16i[std::countr_one(i >> 4) + 4];
    }
};
template <u32 MOD> const FFTInfo<MOD> fft_info = FFTInfo<MOD>();

template <u32 MOD> ModInt8<MOD> fft_single(ModInt8<MOD> x) {
    static const FFTInfo<MOD>& info = fft_info<MOD>;
    static const ModInt<MOD> w4 = info.w[2], w8 = info.w[3];
    static const auto step4 = ModInt8<MOD>(1, 1, 1, w4, 1, 1, 1, w4);
    static const auto step8 =
        ModInt8<MOD>(1, 1, 1, 1, 1, w8, w8 * w8, w8 * w8 * w8);

    x = (blend<0b11110000>(x, -x) + x.permutevar({4, 5, 6, 7, 0, 1, 2, 3})) *
        step8;
    x = (blend<0b11001100>(x, -x) + x.permutevar({2, 3, 0, 1, 6, 7, 4, 5})) *
        step4;
    x = (blend<0b10101010>(x, -x) + x.permutevar({1, 0, 3, 2, 5, 4, 7, 6}));
    return x;
}

template <u32 MOD> ModInt8<MOD> ifft_single(ModInt8<MOD> x) {
    static const FFTInfo<MOD>& info = fft_info<MOD>;
    static const ModInt<MOD> iw4 = info.iw[2], iw8 = info.iw[3];
    static const auto step4 = ModInt8<MOD>(1, 1, 1, iw4, 1, 1, 1, iw4);
    static const auto step8 =
        ModInt8<MOD>(1, 1, 1, 1, 1, iw8, iw8 * iw8, iw8 * iw8 * iw8);

    x = (blend<0b10101010>(x, -x) + x.permutevar({1, 0, 3, 2, 5, 4, 7, 6})) *
        step4;
    x = (blend<0b11001100>(x, -x) + x.permutevar({2, 3, 0, 1, 6, 7, 4, 5})) *
        step8;
    x = (blend<0b11110000>(x, -x) + x.permutevar({4, 5, 6, 7, 0, 1, 2, 3}));

    return x;
}

template <std::ranges::random_access_range R>
    requires is_modint8<std::ranges::range_value_t<R>>::value
void fft(R&& a) {
    using modint8 = std::ranges::range_value_t<R>;
    static constexpr u32 MOD = modint8::mod();

    static const FFTInfo<MOD>& info = fft_info<MOD>;

    const int n = int(a.size());
    const int lg = std::countr_zero((u32)n);

    int h = lg;
    if (h % 2) {
        // 2-base
        int len = n / 2;
        for (int i = 0; i < len; i++) {
            auto l = a[0 * len + i];
            auto r = a[1 * len + i];
            a[0 * len + i] = l + r;
            a[1 * len + i] = l - r;
        }
        h--;
    }
    while (h >= 2) {
        // 4-base
        static const modint8 w2 = modint8::set1(info.w[2]);

        modint8 rotx = modint8::set1(1);
        for (int start = 0; start < n; start += (1 << h)) {
            const modint8 rot2x = rotx * rotx;
            const modint8 rot3x = rot2x * rotx;

            int len = 1 << (h - 2);
            for (int i = 0; i < len; i++) {
                auto a0 = a[start + 0 * len + i];
                auto a1 = a[start + 1 * len + i] * rotx;
                auto a2 = a[start + 2 * len + i] * rot2x;
                auto a3 = a[start + 3 * len + i] * rot3x;

                auto x = (a1 - a3) * w2;
                a[start + 0 * len + i] = (a0 + a2) + (a1 + a3);
                a[start + 1 * len + i] = (a0 + a2) - (a1 + a3);
                a[start + 2 * len + i] = (a0 - a2) + x;
                a[start + 3 * len + i] = (a0 - a2) - x;
            }
            rotx *= modint8::set1(info.rot_shift8(8 * (start >> h)));
        }
        h -= 2;
    }

    {
        // fft each element
        modint8 rotxi = modint8::set1(1);
        for (int i = 0; i < n; i++) {
            a[i] = fft_single(a[i] * rotxi);
            rotxi *= info.rot_shift16i(16 * i);
        }
    }
}

template <std::ranges::random_access_range R>
    requires is_modint8<std::ranges::range_value_t<R>>::value
void ifft(R&& a) {
    using modint8 = std::ranges::range_value_t<R>;
    static constexpr u32 MOD = modint8::mod();

    static const FFTInfo<MOD>& info = fft_info<MOD>;

    const int n = int(a.size());
    const int lg = std::countr_zero((u32)n);

    {
        // 8-base
        modint8 irotxi = modint8::set1(1);
        for (int i = 0; i < n; i++) {
            a[i] = ifft_single(a[i]) * irotxi;
            irotxi *= info.irot_shift16i(16 * i);
        }
    }

    int h = 0;
    while (h + 2 <= lg) {
        h += 2;

        // 4-base
        static const modint8 w2 = modint8::set1(info.iw[2]);

        modint8 rotx = modint8::set1(1);
        for (int start = 0; start < n; start += (1 << h)) {
            const auto rot2x = rotx * rotx;
            const auto rot3x = rot2x * rotx;
            int len = 1 << (h - 2);
            for (int i = 0; i < len; i++) {
                auto a0 = a[start + 0 * len + i];
                auto a1 = a[start + 1 * len + i];
                auto a2 = a[start + 2 * len + i];
                auto a3 = a[start + 3 * len + i];

                auto x0 = a0 + a1;
                auto x1 = a0 - a1;
                auto x2 = a2 + a3;
                auto x3 = (a2 - a3) * w2;

                a[start + 0 * len + i] = x0 + x2;
                a[start + 1 * len + i] = (x1 + x3) * rotx;
                a[start + 2 * len + i] = (x0 - x2) * rot2x;
                a[start + 3 * len + i] = (x1 - x3) * rot3x;
            }
            rotx *= modint8::set1(info.irot_shift8(8 * (start >> h)));
        }
    }

    if (h + 1 == lg) {
        // 2-base
        int len = n / 2;
        for (int i = 0; i < len; i++) {
            auto l = a[0 * len + i];
            auto r = a[1 * len + i];
            a[0 * len + i] = l + r;
            a[1 * len + i] = l - r;
        }
        h++;
    }
}

}  // namespace fastfps
#line 10 "/home/vscode/fastfps/src/fastfps/modvec.hpp"

namespace fastfps {

template <int MOD> struct ModVec {
    using modint = ModInt<MOD>;
    using modint8 = ModInt8<MOD>;

  public:
    ModVec() : n(0), v() {}
    explicit ModVec(ssize_t _n) : n(_n), v(vsize(_n)) {}
    ModVec(std::initializer_list<u32> li) : n(ssize(li)), v(vsize(n)) {
        auto it = li.begin();
        for (int i = 0; i < ssize(v); i++) {
            std::array<u32, 8> buf = {};
            for (int j = 0; j < 8 && (i * 8 + j) < n; j++) {
                buf[j] = *it;
                it++;
            }
            v[i] = modint8(buf);
        }
    }
    ModVec(std::initializer_list<i32> li) : n(ssize(li)), v(vsize(n)) {
        auto it = li.begin();
        for (int i = 0; i < ssize(v); i++) {
            std::array<i32, 8> buf = {};
            for (int j = 0; j < 8 && (i * 8 + j) < n; j++) {
                buf[j] = *it;
                it++;
            }
            v[i] = modint8(buf);
        }
    }

    ModVec(const std::vector<modint>& _v) : n(std::ssize(_v)), v(vsize(n)) {
        for (int i = 0; i < std::ssize(v); i++) {
            std::array<modint, 8> buf{};
            for (int j = 0; j < 8 && (i * 8 + j) < n; j++) {
                buf[j] = _v[i * 8 + j];
            }
            v[i] = modint8(buf);
        }
    }
    ModVec(const std::vector<u32>& _v) : n(std::ssize(_v)), v(vsize(n)) {
        for (int i = 0; i < std::ssize(v); i++) {
            std::array<u32, 8> buf{};
            for (int j = 0; j < 8 && (i * 8 + j) < n; j++) {
                buf[j] = _v[i * 8 + j];
            }
            v[i] = modint8(buf);
        }
    }

    size_t size() const { return n; }

    std::vector<u32> val() const {
        std::vector<u32> _v(n);
        for (int i = 0; i < std::ssize(v); i++) {
            std::array<u32, 8> buf = v[i].val();
            for (int j = 0; j < 8 && (i * 8 + j) < n; j++) {
                _v[i * 8 + j] = buf[j];
            }
        }
        return _v;
    }
    u32 val(ssize_t index) const {
        if (index < 0 || n <= index) return 0;
        // todo: optimzie
        return v[index / 8].val()[index % 8];
    }

    void resize(ssize_t sz) {
        n = sz;
        v.resize(vsize(n));
        clear_last();
        return;
    }

    ModVec& operator+=(const ModVec& rhs) {
        n = std::max(n, rhs.n);
        if (std::size(v) < std::size(rhs.v)) {
            v.resize(std::size(rhs.v));
        }
        for (int i = 0; i < std::ssize(rhs.v); i++) {
            v[i] += rhs.v[i];
        }
        return *this;
    }
    friend ModVec operator+(const ModVec& lhs, const ModVec& rhs) {
        return ModVec(lhs) += rhs;
    }

    ModVec& operator-=(const ModVec& rhs) {
        n = std::max(n, rhs.n);
        if (std::size(v) < std::size(rhs.v)) {
            v.resize(std::size(rhs.v));
        }
        for (int i = 0; i < std::ssize(rhs.v); i++) {
            v[i] -= rhs.v[i];
        }
        return *this;
    }
    friend ModVec operator-(const ModVec& lhs, const ModVec& rhs) {
        return ModVec(lhs) -= rhs;
    }

    friend bool operator==(const ModVec& lhs, const ModVec& rhs) {
        return lhs.n == rhs.n && lhs.v == rhs.v;
    }

    ModVec& operator*=(const ModVec& rhs) {
        if (n == 0 || rhs.n == 0) {
            n = 0;
            v.clear();
            return *this;
        }
        auto rv = rhs.v;

        n += rhs.n - 1;

        ssize_t v_up = (ssize_t)std::bit_ceil((size_t)vsize(n));
        v.resize(v_up);
        rv.resize(v_up);
        fft(v);
        fft(rv);
        for (int i = 0; i < v_up; i++) {
            v[i] *= rv[i];
        }
        ifft(v);

        v.resize(vsize(n));

        modint8 inv = modint8::set1(modint(8 * v_up).inv());
        for (auto& x : v) x *= inv;
        return *this;
    }
    friend ModVec operator*(const ModVec& lhs, const ModVec& rhs) {
        return ModVec(lhs) *= rhs;
    }

    ModVec& operator*=(const modint& rhs) {
        modint8 r = modint8::set1(rhs);
        for (auto& x : v) x *= r;
        return *this;
    }
    friend ModVec operator*(const ModVec& lhs, const modint& rhs) {
        return ModVec(lhs) *= rhs;
    }
    friend ModVec operator*(const modint& lhs, const ModVec& rhs) {
        return ModVec(rhs) *= lhs;
    }

    // dst[dst_start .. dst_start + len) = this[start .. start + len)
    void copy_to(ssize_t start,
                 ssize_t len,
                 ModVec& dst,
                 ssize_t dst_start) const {
        // TODO: be able to self move
        assert(0 <= start && start + len <= n);
        assert(0 <= dst_start && dst_start + len <= dst.n);
        if (len == 0) return;

        auto succ = [&](ssize_t len2) {
            start += len2;
            dst_start += len2;
            len -= len2;
        };
        if (start % 8 == dst_start % 8) {
            {
                ssize_t len2 = std::min(len, 8 - dst_start % 8);
                const auto mask = [&]() {
                    std::array<u32, 8> b;
                    for (int i = 0; i < 8; i++) {
                        b[i] = (dst_start % 8 <= i && i < dst_start % 8 + len2);
                    }
                    return b;
                }();
                dst.v[dst_start / 8] =
                    blendvar(dst.v[dst_start / 8], v[start / 8], mask);
                succ(len2);
            }
            if (len == 0) return;
            assert(start % 8 == 0 && dst_start % 8 == 0);
            while (len >= 8) {
                // TODO: use std::copy
                dst.v[dst_start / 8] = v[start / 8];
                succ(8);
            }
            if (len == 0) return;
            {
                ssize_t len2 = len;
                const auto mask = [&]() {
                    std::array<u32, 8> b;
                    for (int i = 0; i < 8; i++) {
                        b[i] = (i < len2);
                    }
                    return b;
                }();
                dst.v[dst_start / 8] =
                    blendvar(dst.v[dst_start / 8], v[start / 8], mask);
                succ(len2);
            }
        } else {
            const ssize_t shift = (start + 8 - dst_start % 8) % 8;
            const auto blend_mask = [&]() {
                std::array<u32, 8> b;
                for (int i = 0; i < 8; i++) {
                    b[i] = (8 - shift <= i);
                }
                return b;
            }();
            {
                ssize_t len2 = std::min(len, 8 - dst_start % 8);
                const auto mask = [&]() {
                    std::array<u32, 8> b;
                    for (int i = 0; i < 8; i++) {
                        b[i] = (dst_start % 8 <= i && i < dst_start % 8 + len2);
                    }
                    return b;
                }();
                auto x = v[start / 8].rotate((u32)shift);
                if (len2 > 8 - start % 8) {
                    x = blendvar(x, v[start / 8 + 1].rotate((u32)(shift)),
                                 blend_mask);
                }
                dst.v[dst_start / 8] = blendvar(dst.v[dst_start / 8], x, mask);
                succ(len2);
            }
            if (len == 0) return;

            while (len >= 8) {
                modint8 l = v[start / 8], r = v[start / 8 + 1];
                dst.v[dst_start / 8] = blendvar(
                    l.rotate(u32(shift)), r.rotate(u32(shift)), blend_mask);
                succ(8);
            }
            if (len == 0) return;
            {
                ssize_t len2 = len;
                const auto mask = [&]() {
                    std::array<u32, 8> b = {};
                    for (int i = 0; i < 8; i++) {
                        b[i] = (i < len2);
                    }
                    return b;
                }();
                auto x = v[start / 8].rotate((u32)shift);
                if (len2 > 8 - start % 8) {
                    x = blendvar(x, v[start / 8 + 1].rotate((u32)(shift)),
                                 blend_mask);
                }
                dst.v[dst_start / 8] = blendvar(dst.v[dst_start / 8], x, mask);
                succ(len2);
            }
        }
    }

    ModVec& operator<<=(ssize_t s) {
        n += s;
        if (s % 8 == 0) {
            v.insert(v.begin(), s / 8, modint8());
        } else {
            v.resize(vsize(n));

            const auto mask = [&]() {
                std::array<u32, 8> b;
                for (int i = 0; i < 8; i++) {
                    b[i] = ((s % 8) <= i);
                }
                return b;
            }();
            for (auto i = std::ssize(v) - 1; i >= s / 8 + 1; i--) {
                modint8 l = v[i - 1 - s / 8], r = v[i - s / 8];
                v[i] = blendvar(l.rotate(u32(s % 8)), r.rotate(u32(8 - s % 8)),
                                mask);
            }
            v[s / 8] = blendvar(modint8(), v[0].rotate(u32(8 - s % 8)), mask);
            std::ranges::fill_n(v.begin(), s / 8, modint8());
        }
        return *this;
    }
    friend ModVec operator<<(const ModVec& lhs, ssize_t s) {
        return ModVec(lhs) <<= s;
    }

    ModVec inv(int m) const {
        // TODO: Optimize
        assert(val(0) == 1);
        ModVec res = ModVec({1});
        for (ssize_t i = 1; i < m; i *= 2) {
            ModVec pre(2 * i);
            copy_to(0, std::min(n, 2 * i), pre, 0);
            res = (res * 2 - res * res * pre);
            res.resize(2 * i);
        }
        res.resize(m);
        return res;
    }

    ModVec substr(ssize_t st, ssize_t len) const {
        assert(0 <= st && 0 <= len && st + len <= n);

        ModVec b(len);
        copy_to(st, len, b, 0);
        return b;
    }

    // sum a[i] * b[i]
    friend modint dot(const ModVec& lhs, const ModVec& rhs) {
        modint8 sum;
        for (int i = 0; i < std::min(std::ssize(lhs.v), std::ssize(rhs.v));
             i++) {
            sum += lhs.v[i] * rhs.v[i];
        }
        auto a = sum.val();
        // TODO: optimize
        modint ans;
        for (int i = 0; i < 8; i++) {
            ans += a[i];
        }
        return ans;
    }

    void reverse() {
        auto prev_n = n;
        n = std::ssize(v) * 8;
        std::reverse(v.begin(), v.end());
        for (modint8& x : v) {
            x = x.permutevar({7, 6, 5, 4, 3, 2, 1, 0});
        }

        ModVec tmp(prev_n);
        copy_to(n - prev_n, prev_n, tmp, 0);
        *this = tmp;
    }

    ModVec berlekamp_massey() const {
        ModVec b({-1}), c({-1});
        modint y = 1;
        for (int ed = 1; ed <= n; ed++) {
            int l = int(c.size()), m = int(b.size());
            b.resize(m + 1);
            m++;

            modint x = dot(c, substr(ed - l, l));
            if (x == 0) continue;
            modint freq = x * y.inv();
            if (l < m) {
                // use b
                auto prev_c = c;

                ModVec tmp(m);
                c.copy_to(0, l, tmp, m - l);
                c = tmp;
                c -= freq * b;

                b = prev_c;
                y = x;
            } else {
                // use c

                ModVec tmp(l);
                b.copy_to(0, m, tmp, l - m);

                c -= freq * tmp;
            }
        }
        c.reverse();
        return c;
    }

    friend std::ostream& operator<<(std::ostream& os, const ModVec& r) {
        auto r2 = r.val();

        os << "[";
        for (int i = 0; i < std::ssize(r2); i++) {
            if (i) os << ", ";
            os << r2[i];
        }
        return os << "]";
    }

  private:
    ssize_t n;
    std::vector<modint8> v;

    static ssize_t vsize(ssize_t n) { return (n + 7) / 8; }

    void clear_last() {
        if (n % 8 == 0) return;
        v.back() = blendvar(v.back(), modint8(), [&]() {
            std::array<u32, 8> b;
            for (int i = 0; i < 8; i++) {
                b[i] = ((n % 8) <= i);
            }
            return b;
        }());
    }
};

}  // namespace fastfps
#line 8 "ucup3-13/K/main.cpp"

using namespace yosupo;

using mint = fastfps::ModInt<998244353>;
using mvec = fastfps::ModVec<998244353>;

#line 2 "ucup3-13/K/base.hpp"

#ifdef YOSUPO_AVX2_PRAGMA
#line 5 "ucup3-13/K/base.hpp"
#pragma GCC target("avx2,bmi,bmi2,lzcnt,popcnt")
#endif

#line 11 "ucup3-13/K/base.hpp"
#include <bitset>
#line 13 "ucup3-13/K/base.hpp"
#include <cmath>
#include <cstdio>
#line 17 "ucup3-13/K/base.hpp"
#include <map>
#include <queue>
#line 20 "ucup3-13/K/base.hpp"
#include <set>
#line 22 "ucup3-13/K/base.hpp"
#include <utility>
#line 24 "ucup3-13/K/base.hpp"

using std::abs, std::pow, std::sqrt;
using std::array, std::vector, std::string, std::queue, std::deque;
using std::countl_zero, std::countl_one, std::countr_zero, std::countr_one;
using std::istream, std::ostream, std::cerr, std::endl;
using std::min, std::max, std::swap;
using std::pair, std::tuple, std::bitset;
using std::popcount;
using std::priority_queue, std::set, std::multiset, std::map;
using std::views::iota, std::views::reverse;

namespace ranges = std::ranges;
using ranges::sort, ranges::copy_n;

using uint = unsigned int;
using ll = long long;
using ull = unsigned long long;
constexpr ll TEN(int n) { return (n == 0) ? 1 : 10 * TEN(n - 1); }
template <class T> using V = vector<T>;
template <class T> using VV = V<V<T>>;

#ifdef YOSUPO_LOCAL

inline ostream& operator<<(ostream& os, __int128_t x) {
    if (x < 0) {
        os << "-";
        x *= -1;
    }
    if (x == 0) {
        return os << "0";
    }
    string s;
    while (x) {
        s += char(x % 10 + '0');
        x /= 10;
    }
    ranges::reverse(s);
    return os << s;
}
inline ostream& operator<<(ostream& os, __uint128_t x) {
    if (x == 0) {
        return os << "0";
    }
    string s;
    while (x) {
        s += char(x % 10 + '0');
        x /= 10;
    }
    ranges::reverse(s);
    return os << s;
}

template <class T, class U>
ostream& operator<<(ostream& os, const pair<T, U>& p);
template <class T> ostream& operator<<(ostream& os, const V<T>& v);
template <class T> ostream& operator<<(ostream& os, const deque<T>& v);
template <class T, size_t N>
ostream& operator<<(ostream& os, const array<T, N>& a);
template <class T> ostream& operator<<(ostream& os, const set<T>& s);
template <class T, class U>
ostream& operator<<(ostream& os, const map<T, U>& m);

template <class T, class U>
ostream& operator<<(ostream& os, const pair<T, U>& p) {
    return os << "P(" << p.first << ", " << p.second << ")";
}

template <class T> ostream& operator<<(ostream& os, const V<T>& v) {
    os << "[";
    bool f = false;
    for (auto d : v) {
        if (f) os << ", ";
        f = true;
        os << d;
    }
    return os << "]";
}

template <class T> ostream& operator<<(ostream& os, const deque<T>& v) {
    os << "[";
    bool f = false;
    for (auto d : v) {
        if (f) os << ", ";
        f = true;
        os << d;
    }
    return os << "]";
}
template <class T, size_t N>
ostream& operator<<(ostream& os, const array<T, N>& a) {
    os << "[";
    bool f = false;
    for (auto d : a) {
        if (f) os << ", ";
        f = true;
        os << d;
    }
    return os << "]";
}

template <class T> ostream& operator<<(ostream& os, const set<T>& s) {
    os << "{";
    bool f = false;
    for (auto d : s) {
        if (f) os << ", ";
        f = true;
        os << d;
    }
    return os << "}";
}
template <class T> ostream& operator<<(ostream& os, const multiset<T>& s) {
    os << "{";
    bool f = false;
    for (auto d : s) {
        if (f) os << ", ";
        f = true;
        os << d;
    }
    return os << "}";
}

template <class T, class U>
ostream& operator<<(ostream& os, const map<T, U>& s) {
    os << "{";
    bool f = false;
    for (auto p : s) {
        if (f) os << ", ";
        f = true;
        os << p.first << ": " << p.second;
    }
    return os << "}";
}

struct PrettyOS {
    ostream& os;
    bool first;

    template <class T> auto operator<<(T&& x) {
        if (!first) os << ", ";
        first = false;
        os << x;
        return *this;
    }
};
template <class... T> void dbg0(T&&... t) {
    (PrettyOS{cerr, true} << ... << t);
}
#define dbg(...)                                            \
    do {                                                    \
        cerr << __LINE__ << " : " << #__VA_ARGS__ << " = "; \
        dbg0(__VA_ARGS__);                                  \
        cerr << endl;                                       \
    } while (false);
#else
#define dbg(...)
#endif
#line 15 "ucup3-13/K/main.cpp"

Scanner sc = Scanner(stdin);
Printer pr = Printer(stdout);

const int MX = 8003;

V<mvec> left(MX), right(MX);

void init() {
    {
        V<mint> buf(MX);
        for (int i : iota(0, MX)) {
            buf[i] = (i % 2 ? -1 : 1);
        }
        for (int N : iota(1, MX)) {
            for (int i : iota(0, MX)) {
                buf[i] *= i;
            }
            left[N] = mvec(buf);
        }
    }
    {
        VV<mint> comb(MX, V<mint>(MX));
        comb[0][0] = 1;
        for (int i : iota(1, MX)) {
            comb[i][0] = 1;
            for (int j : iota(1, i + 1)) {
                comb[i][j] = comb[i - 1][j - 1] + comb[i - 1][j];
            }
        }

        for (int M : iota(1, MX - 1)) {
            comb[M + 1].resize(M + 1);
            right[M] = mvec(comb[M + 1]);
        }
    }
}


mint fast(int N, int M) {
    mint sum = dot(left[N], right[M]);
    sum *= mint(-1).pow(M);
    sum *= mint(M).pow(N).inv();
    sum -= 1;
    return sum;
}

int main() {
    init();

    int T;
    sc.read(T);

    for (int _ : iota(0, T)) {
        int N, M;
        sc.read(N, M);
        // N = uniform(1, 8000);
        // M = uniform(1, 8000);

        mint ans = fast(N, M);
        pr.writeln(ans.val());
    }

    return 0;
}

Details

Tip: Click on the bar to expand more detailed information

Test #1:

score: 100
Accepted
time: 230ms
memory: 629920kb

input:

4
3 2
1 1
20 23
8000 8000

output:

374341634
1
111675632
994279778

result:

ok 4 tokens

Test #2:

score: 0
Accepted
time: 227ms
memory: 629868kb

input:

5
60 26
33 95
18 89
82 12
77 36

output:

945602338
254913692
403396795
820508695
360125985

result:

ok 5 tokens

Test #3:

score: 0
Accepted
time: 243ms
memory: 629884kb

input:

5
23 13
95 8
73 19
72 74
23 51

output:

788774542
935467825
483603650
274447212
738760583

result:

ok 5 tokens

Test #4:

score: 0
Accepted
time: 240ms
memory: 629760kb

input:

5
7 79
47 12
64 29
23 59
88 21

output:

238359778
424364643
993714623
760177301
865871793

result:

ok 5 tokens

Test #5:

score: 0
Accepted
time: 252ms
memory: 629680kb

input:

5
39 47
22 33
2 58
43 45
32 67

output:

68068469
21035974
735626561
965644028
137192045

result:

ok 5 tokens

Test #6:

score: 0
Accepted
time: 255ms
memory: 629652kb

input:

5
57 73
20 64
18 72
56 64
9 58

output:

218207240
814770590
121270366
636721674
420274847

result:

ok 5 tokens

Test #7:

score: 0
Accepted
time: 232ms
memory: 629936kb

input:

5
100 100
100 99
99 100
98 99
99 97

output:

585389012
131732771
619127511
549657738
490584077

result:

ok 5 tokens

Test #8:

score: 0
Accepted
time: 260ms
memory: 629644kb

input:

1922
4663 5021
7459 306
3249 6943
4902 4260
6118 5364
4997 7021
6772 3346
3916 7327
7156 4792
1228 5381
3240 7026
131 5713
1120 5334
2186 610
7638 2846
891 6274
5363 426
1335 7417
2127 396
323 7781
5435 1922
4989 5238
2886 3788
5413 1384
7624 4245
7191 6758
7755 5835
7660 1787
1043 7586
803 7889
79 ...

output:

672342508
406758717
456109836
583347519
254351863
547587964
177045319
935533988
555369350
136991350
790497273
429246740
670208582
782070778
169184793
771435402
251034885
528072506
303570823
257245963
629853925
267752975
350150586
786769060
44222606
607226242
320315817
861879910
752261031
341472947
2...

result:

ok 1922 tokens

Test #9:

score: 0
Accepted
time: 247ms
memory: 629924kb

input:

1569
1690 3118
4489 1453
6866 3161
6664 1290
2600 7962
6689 4642
522 772
2162 4794
3190 5987
3327 4938
6130 3823
6941 5425
3091 6213
3025 388
5330 3690
3161 6492
1740 5873
5530 1458
2496 6781
6287 5635
662 3877
3505 5138
2511 2028
3500 859
7572 813
2520 3943
7377 4768
6158 1882
7427 1702
4296 5159
5...

output:

786392950
680031668
677629004
801851613
786349751
79816839
959519914
318092993
339917671
724667845
890615671
100962701
589915015
941504560
820459949
486565344
823734064
220460851
576680186
554430485
361102164
218914963
840663949
777667686
736007308
919520675
863371619
66677855
637862969
67422276
384...

result:

ok 1569 tokens

Test #10:

score: 0
Accepted
time: 215ms
memory: 629656kb

input:

1181
4017 5052
5241 7494
7719 3875
7903 143
7280 2239
6098 2785
4900 5047
3542 4892
3011 430
4358 3184
1473 1501
2732 5656
6806 7106
6079 4418
4893 233
1746 3558
3801 650
4506 970
7836 5225
1970 1822
3342 7672
3519 1017
6258 3172
6871 3994
4143 3721
1752 2936
5806 2553
1727 3701
6464 2302
2048 3091
...

output:

648881231
526073149
469264135
392921762
374237236
765018788
699026377
457948355
693169225
754094043
700515631
122741833
428610910
661965148
268857241
313001621
686530925
177273994
339148514
571456944
973936686
176745436
23414882
360870357
623038194
895354617
386646311
288047747
236022755
955017813
1...

result:

ok 1181 tokens

Test #11:

score: 0
Accepted
time: 214ms
memory: 629676kb

input:

1080
7499 4465
5556 2341
808 1986
3404 6901
4609 4168
235 5744
5131 7261
6616 1993
4624 3943
5843 6392
4889 2743
386 6670
1188 23
4216 4225
1193 1295
6097 4160
710 2728
7146 4193
5425 4148
6206 7462
7147 1808
2381 1254
4193 1297
1359 233
991 6979
5009 6963
1824 2135
1078 6208
2893 5858
320 4173
4937...

output:

584491148
616649457
512306930
528213999
550156793
344729669
779502829
828764040
365090398
371482124
273983459
617971432
137019685
400487464
761520033
143391408
908639433
294086517
926654429
723576006
993426946
572674399
178336952
402120004
148856064
897242602
390050708
850225145
605879501
962941650
...

result:

ok 1080 tokens

Test #12:

score: 0
Accepted
time: 219ms
memory: 629928kb

input:

1534
2137 7885
2676 2513
53 3021
1623 5195
660 4999
2881 7697
6034 6429
4724 4014
5986 266
7826 726
4086 6628
7498 6114
4801 4415
5037 4206
700 6054
3497 476
1715 5892
6009 6340
1251 2345
2819 4107
7544 864
3138 4179
3909 912
180 4496
4727 2930
1057 7077
4123 2560
4963 4100
7118 463
2945 935
6573 41...

output:

676937061
816416208
899106800
778722088
621854770
637694747
789726622
647248717
143759992
290955099
204045987
17260543
508242895
836696138
605720517
462338702
426815143
443255417
341689094
660082176
461660684
531200268
467927798
816405934
307396775
786033585
765478425
774747686
67909522
155061063
47...

result:

ok 1534 tokens

Test #13:

score: 0
Accepted
time: 1110ms
memory: 629876kb

input:

300000
1983 855
7767 4477
6925 7526
7306 5358
3987 46
5716 3789
4487 4391
4358 7525
933 1015
953 546
5716 5487
968 6561
2932 6558
6796 1429
4864 4211
5955 4414
6657 5171
2784 3725
1139 7304
553 3163
7248 6772
1977 6216
4701 7267
6130 4055
5688 1364
1335 4326
2633 3945
7851 5521
6474 2532
6869 5201
2...

output:

917986185
514093688
240004856
10138263
106086887
486293160
462563200
380236329
178495199
768072852
293049871
679765965
19413063
914310451
303877752
97576016
551398628
294935753
497649688
625770227
916721949
945723005
793837895
598750153
811171822
281042931
224310375
229099648
232754408
173968951
334...

result:

ok 300000 tokens

Test #14:

score: 0
Accepted
time: 1132ms
memory: 629932kb

input:

300000
6276 3969
1337 287
69 4971
4553 4420
4304 107
836 5154
7039 7495
4074 5597
3321 6214
5997 5958
1357 67
5347 5263
5228 5204
6067 7567
3498 226
1830 3989
7897 3908
4547 714
1973 4138
3392 2046
6781 2623
7423 7027
3219 1631
688 6768
1270 5667
1911 1106
4914 755
4060 6194
5588 6416
5379 3593
4950...

output:

785609765
389521714
617648697
133397962
663080285
932116327
864145458
250419436
926868327
231968290
706343931
34357834
259117474
30429506
802394434
962282557
421143424
325071266
930611818
413209658
588520237
879895836
293550595
779472804
703506662
997419552
167326709
571013401
948481475
873418350
52...

result:

ok 300000 tokens

Test #15:

score: 0
Accepted
time: 1097ms
memory: 629936kb

input:

300000
172 7671
2377 1841
772 2572
897 2774
7862 7766
563 7835
50 5627
3975 332
3125 4092
6642 7913
377 4237
5378 2346
7235 484
7254 4026
5032 189
698 3244
5656 1277
42 5418
294 7339
6054 5619
5273 6487
3381 4739
1652 5241
5455 6606
5194 1556
2248 5307
6266 94
6669 4982
4033 4379
6666 4863
7785 583
...

output:

690315780
651031191
910258157
142140073
777756320
339555304
856925271
481764268
804784924
892959827
162363106
880216583
28750709
919204633
590976688
235862971
115143352
552437269
440186544
342438715
203287097
208201535
473851494
630433067
795957931
121121486
655185544
120192487
18559533
512410924
14...

result:

ok 300000 tokens

Test #16:

score: 0
Accepted
time: 1061ms
memory: 629896kb

input:

300000
7687 5348
7170 7128
1126 3094
1811 2132
4535 2558
6168 62
1913 315
454 6832
2620 979
6268 2470
7745 4962
5836 455
2548 2645
1190 4820
1664 7069
1853 3559
1684 324
2964 2375
6535 2140
5793 6520
2089 2949
6810 6376
3938 1105
3321 2276
1764 7871
7238 4463
6621 6709
4794 1247
1193 3711
7945 25
75...

output:

467980791
680962696
898655348
87851601
574364215
617075952
975724718
232344677
97747094
798035755
544312119
750213987
398352588
468271115
911224185
789740750
889993565
757589351
219602000
508186836
143616463
496959998
957512294
48894767
747840016
237688107
834496842
452902067
436640761
68924558
4766...

result:

ok 300000 tokens

Test #17:

score: 0
Accepted
time: 1085ms
memory: 629828kb

input:

300000
3651 4395
598 2124
7806 1885
6102 3232
1632 4425
2814 2949
2885 4010
719 5821
945 382
3259 3899
1193 2658
3681 176
6978 3339
5065 458
7910 7330
7480 2560
1144 4193
3047 5955
690 5384
6928 5609
238 904
6819 6617
2297 2464
1956 4427
3070 7665
57 5624
1382 7277
1510 931
5413 6319
4135 5153
1245 ...

output:

185080421
622515437
953285449
259657392
382766568
389748070
912098350
791812015
122470478
542646121
189378193
481103802
38378800
282397881
456885301
463133196
542482622
956189657
306447176
892824103
231973605
607936904
612962412
787715604
946988413
397452805
443819486
441909715
443478773
675662739
2...

result:

ok 300000 tokens

Test #18:

score: 0
Accepted
time: 750ms
memory: 629844kb

input:

300000
5511 1592
3091 222
3042 2846
4996 1848
2759 719
339 41
7833 6657
6578 4870
5836 3918
3287 2592
6888 254
323 257
3894 762
2781 147
6338 4197
2401 5526
309 111
499 475
68 1
1791 1498
1139 172
7367 5346
1326 1086
6056 3244
1539 870
2161 577
6899 4934
3222 2409
5094 4945
1252 389
7532 3877
4849 2...

output:

308162096
926831023
97466439
381502673
879141892
288558285
376988538
114780505
967786299
109837829
456357766
152648543
358087181
727740397
203822224
512742419
592251017
205442121
1
187347956
440265112
31975034
944117166
277099223
807372439
313788153
396485979
416038692
118014328
380422322
384451082
...

result:

ok 300000 tokens

Test #19:

score: 0
Accepted
time: 726ms
memory: 629892kb

input:

300000
5511 2811
3091 225
3042 1281
4996 821
2759 267
339 292
7833 515
6578 5344
5836 1128
3287 398
6888 5910
323 266
3894 3721
2781 2271
6338 5322
6838 6497
309 243
499 486
68 11
1791 100
1139 514
7367 5113
1326 747
6056 1604
1539 782
2161 762
6899 4749
3222 2011
5094 3978
1252 623
7532 5477
4849 4...

output:

665054891
300867667
348283279
466053547
45744379
708735980
593404766
831832507
489279444
573407999
597639718
5766230
375599902
486548670
501927978
980593373
969955705
448325802
388400601
262385137
375376816
110122988
737706874
150359153
575621812
804184716
68665586
818047613
692689346
78602127
45512...

result:

ok 300000 tokens

Test #20:

score: 0
Accepted
time: 713ms
memory: 629928kb

input:

300000
5511 413
3091 2856
3042 1024
4996 3213
2759 105
339 327
7833 5988
6578 1636
5836 315
3287 1972
6888 1326
323 60
3894 816
2781 1712
6338 4382
2852 7641
309 57
499 167
68 23
1791 1375
1139 348
7367 6505
1326 435
6056 4617
1539 1133
2161 910
6899 1763
3222 1481
5094 2477
1252 1156
7532 6557
4849...

output:

485659367
677896371
51153808
69443182
412971885
818481416
849977792
331829138
55724792
462907888
637926
406804012
381350405
51624478
359208029
272155650
163436382
342656855
200714626
498916202
182274510
677459983
991151110
396383019
392439555
63570810
520284517
966012692
88444228
86200285
555967449
...

result:

ok 300000 tokens

Test #21:

score: 0
Accepted
time: 706ms
memory: 629840kb

input:

300000
5511 2520
3091 2007
3042 2527
4996 267
2759 1311
339 7
7833 5969
6578 5180
5836 4504
3287 824
6888 1800
323 188
3894 2703
2781 113
6338 5373
210 667
309 5
499 463
68 45
1791 1776
1139 217
7367 6534
1326 193
6056 4824
1539 64
2161 626
6899 2131
3222 2304
5094 908
1252 622
7532 571
4849 1266
15...

output:

476330360
341129155
87686760
780287663
27737410
601067754
621911465
112461167
976022023
494331271
75971592
561865913
585445560
580978232
272409206
301199669
509769247
189882720
370830663
729977839
290413155
663712832
115843838
947770059
572260971
688396109
806982866
335384041
666428123
733355123
403...

result:

ok 300000 tokens

Test #22:

score: 0
Accepted
time: 740ms
memory: 629936kb

input:

300000
5511 2723
3091 2210
3042 1678
4996 3350
2759 1717
339 59
7833 6785
6578 1468
5836 5509
3287 2451
6888 4895
323 38
3894 2668
2781 2757
6338 5735
139 3773
309 296
499 359
68 51
1791 681
1139 990
7367 745
1326 327
6056 4864
1539 1125
2161 808
6899 890
3222 1023
5094 818
1252 185
7532 1083
4849 1...

output:

122256708
329468041
972582618
696900189
185355879
798415905
911105222
943525716
635145786
793642508
954014637
300072137
198622306
632297009
788106407
790602929
474908621
312319885
494386936
195749245
997359493
881353961
668060322
157183412
32778140
733123188
104542588
116382314
860154073
47295
78564...

result:

ok 300000 tokens

Test #23:

score: 0
Accepted
time: 1072ms
memory: 629652kb

input:

300000
7522 7956
7746 7848
7995 7694
7479 7992
7878 7976
7532 7658
7679 7755
7462 7709
7610 7495
7877 7995
7915 7608
7883 7677
7467 7658
7615 7815
7521 7676
7455 7891
7868 7896
7634 7704
7869 7590
7471 7573
7472 7678
7885 7539
7983 7974
7478 7479
7705 7827
7675 7615
7915 7597
7644 7511
7903 7966
750...

output:

350858640
985201186
270505812
117456150
344107653
461416294
951152728
812878714
422195931
502806704
124570242
713987345
272798186
110562310
722669359
200627964
808703774
749707180
560860878
63011161
961348423
407734207
629246603
741475119
234863886
992855605
920110738
57955523
124147954
685852042
92...

result:

ok 300000 tokens

Extra Test:

score: 0
Extra Test Passed