test/yukicoder/1145.test.cpp

View this file on GitHub
Last update: 2025-09-09 22:49:44+09:00
Problem: https://yukicoder.me/problems/no/1145

Depends on

Code

// competitive-verifier: PROBLEM https://yukicoder.me/problems/no/1145
#include "../../poly/sum-of-powers.hpp"
#include "../../template.hpp"
#include <atcoder/modint>
using mint = atcoder::modint998244353;
void solve() {
    INT(n, m);
    vector<mint> a(n);
    rep(i, n) {
        INT(ai);
        a[i] = ai;
    }
    auto f = sum_of_powers(a, m);
    rep(i, 1, m + 1) cout << f[i].val() << " \n"[i == m];
}
/// Entry point: turns off C stdio synchronisation, unties cin from cout,
/// and runs the single test case.
int main() {
    ios::sync_with_stdio(false);
    cin.tie(nullptr);
    solve();
    return 0;
}

#line 1 "test/yukicoder/1145.test.cpp"
// competitive-verifier: PROBLEM https://yukicoder.me/problems/no/1145
#line 2 "other/fastio.hpp"
// ref: https://maspypy.com/library-checker-many-a-b , Nyaanさん
#line 2 "other/type-utils.hpp"
#include <bits/stdc++.h>
// Integer shorthands.
using ll = long long;
using u32 = unsigned;
using u64 = unsigned long long;
using i128 = __int128;
using u128 = unsigned __int128;
// Container and pair shorthands over int.
using vi = std::vector<int>;
using vii = std::vector<vi>;
using pii = std::pair<int, int>;
// Container and pair shorthands over long long.
using vl = std::vector<ll>;
using vll = std::vector<std::vector<ll>>;
using pll = std::pair<ll, ll>;

/// Satisfied by every type that models std::integral, and additionally by the
/// 128-bit aliases i128 and u128 (cv-qualifiers on T are ignored for those).
template <class T>
concept extended_integral =
    std::integral<T> || std::same_as<std::remove_cv_t<T>, i128> ||
    std::same_as<std::remove_cv_t<T>, u128>;
/// Satisfied by every type that models std::signed_integral, and additionally
/// by i128 (cv-qualifiers on T are ignored for the i128 check).
template <class T>
concept extended_signed_integral =
    std::signed_integral<T> || std::same_as<std::remove_cv_t<T>, i128>;
/// Satisfied by every type that models std::unsigned_integral, and
/// additionally by u128 (cv-qualifiers on T are ignored for the u128 check).
template <class T>
concept extended_unsigned_integral =
    std::unsigned_integral<T> || std::same_as<std::remove_cv_t<T>, u128>;

/// Satisfied when a T lvalue can be inserted into a std::ostream with <<, or
/// when T is an extended_integral type (which covers the 128-bit aliases).
template <class T>
concept Streamable =
    requires(std::ostream &os, T &x) { os << x; } || extended_integral<T>;
/// Satisfied by types that expose a val() member whose result is convertible
/// to int. This is a purely structural check; nothing else about the type is
/// verified.
template <class mint>
concept is_modint = requires(mint &x) {
    { x.val() } -> std::convertible_to<int>;
};
#line 4 "other/fastio.hpp"
namespace fastio {
// Capacity in bytes of the input buffer and of the output buffer.
constexpr int SZ = 131072;
// Size of the number-formatting scratch area; the integer reader also uses it
// as the minimum number of buffered bytes it wants before parsing.
constexpr int offset = 64;
// Integers are formatted four decimal digits at a time.
constexpr int mod = 10000;
// Input buffer; unread bytes occupy [in_left, in_right).
char in_buf[SZ];
int in_left = 0;
int in_right = 0;
// Output buffer; pending bytes occupy [0, out_right).
char out_buf[SZ];
// Scratch space used while formatting a single number.
char out_tmp[offset];
int out_right = 0;
// Compile-time table holding the zero-padded four-digit decimal text of every
// value in [0, mod); the text for i occupies num[4 * i] .. num[4 * i + 3].
struct Pre {
    char num[4 * mod]{};
    constexpr Pre() {
        for(int value = 0; value < mod; ++value) {
            const int base = 4 * value;
            num[base + 0] = '0' + value / 1000 % 10;
            num[base + 1] = '0' + value / 100 % 10;
            num[base + 2] = '0' + value / 10 % 10;
            num[base + 3] = '0' + value % 10;
        }
    }
    // Pointer to the four characters for i; the text is not null-terminated.
    constexpr const char *operator[](int i) const { return num + 4 * i; }
} constexpr pre;
// Refills the input buffer: moves the unread bytes to the front, reads from
// stdin into the free tail, and appends a '\n' sentinel whenever the buffer
// did not end up completely full.
void load() {
    const int pending = in_right - in_left;
    memmove(in_buf, in_buf + in_left, pending);
    const auto received = std::fread(in_buf + pending, 1, SZ - pending, stdin);
    in_right = pending + static_cast<int>(received);
    in_left = 0;
    if(in_right < SZ) {
        in_buf[in_right] = '\n';
        ++in_right;
    }
}
// Reads the next non-whitespace character into c, refilling the input buffer
// whenever it has been consumed completely.
void read(char &c) {
    do {
        if(in_left == in_right)
            load();
        c = in_buf[in_left++];
        // isspace is only defined for values representable as unsigned char
        // (or EOF); a plain char may be negative for bytes >= 0x80.
    } while(isspace(static_cast<unsigned char>(c)));
}
// Reads one whitespace-delimited token into s (replacing its previous
// contents), refilling the input buffer whenever it has been consumed.
void read(std::string &s) {
    s.clear();
    char c;
    // Skip leading whitespace. The cast keeps isspace defined for bytes
    // >= 0x80, which are negative when plain char is signed.
    do {
        if(in_left == in_right)
            load();
        c = in_buf[in_left++];
    } while(isspace(static_cast<unsigned char>(c)));
    // Collect characters up to, but not including, the next whitespace byte.
    do {
        s += c;
        if(in_left == in_right)
            load();
        c = in_buf[in_left++];
    } while(!isspace(static_cast<unsigned char>(c)));
}
// Parses one decimal integer from the input buffer into x. A leading '-' is
// honoured only for signed target types.
template <extended_integral T> void read(T &x) {
    // Top the buffer up first: the scanning loops below perform no
    // end-of-buffer checks of their own.
    if(in_right - in_left < offset)
        load();
    // Skip every byte below '-' ('\n' is 10, ' ' is 32, '-' is 45, '0' is 48).
    char c = in_buf[in_left++];
    while(c < '-')
        c = in_buf[in_left++];
    bool negative = false;
    if constexpr(extended_signed_integral<T>) {
        if(c == '-') {
            negative = true;
            c = in_buf[in_left++];
        }
    }
    // Accumulate digits; (c & 15) is the numeric value of an ASCII digit.
    x = 0;
    for(; c >= '0'; c = in_buf[in_left++])
        x = 10 * x + (c & 15);
    if constexpr(extended_signed_integral<T>) {
        if(negative)
            x = -x;
    }
}
// Writes all pending output bytes to stdout and marks the buffer as empty.
void flush() {
    const int pending = out_right;
    out_right = 0;
    fwrite(out_buf, 1, pending, stdout);
}
// Appends the n bytes starting at c to the output buffer, flushing each time
// the buffer is found full.
void write_range(const char *c, int n) {
    for(int done = 0; done < n;) {
        if(out_right == SZ)
            flush();
        const int chunk = std::min(n - done, SZ - out_right);
        memcpy(out_buf + out_right, c + done, chunk);
        out_right += chunk;
        done += chunk;
    }
}

// Appends a single character, flushing first when the buffer is full.
void write(char c) {
    if(out_right == SZ)
        flush();
    out_buf[out_right] = c;
    ++out_right;
}
// Appends a null-terminated C string (the terminator is not written).
void write(const char *c) {
    const auto length = strlen(c);
    write_range(c, length);
}
// Appends the contents of a std::string.
void write(const std::string &s) {
    write_range(s.data(), s.size());
}
// Writes a floating-point value with up to 16 significant digits (%g style).
template <std::floating_point T> void write(T x) {
    int n;
    // float is promoted to double by the variadic call, but long double is
    // passed as-is and must be announced with the L length modifier.
    if constexpr(std::is_same_v<T, long double>)
        n = std::snprintf(out_tmp, sizeof(out_tmp), "%.16Lg", x);
    else
        n = std::snprintf(out_tmp, sizeof(out_tmp), "%.16g", x);
    write_range(out_tmp, n);
}
// Writes a boolean as the single character '1' (true) or '0' (false).
void write(bool x) {
    if(x)
        write('1');
    else
        write('0');
}
// Writes an integer in decimal. Digits are produced four at a time from the
// precomputed table, filling the scratch buffer from its end backwards.
template <extended_integral T> void write(T x) {
    if(x == 0) {
        write('0');
        return; // nothing else to emit for zero
    }
    if constexpr(extended_signed_integral<T>) {
        if(x < 0) {
            write('-');
            // Negate in the unsigned domain: -x overflows for the most
            // negative value of a signed type, unsigned negation is exact.
            if constexpr(std::same_as<std::remove_cv_t<T>, i128>) {
                write(-static_cast<u128>(x));
            } else {
                using U = std::make_unsigned_t<T>;
                write(static_cast<U>(U{} - static_cast<U>(x)));
            }
            return;
        }
    }
    if(SZ - out_right < offset)
        flush();
    int cur = offset;
    // Full four-digit groups, least significant first.
    for(; x >= 1000; x /= mod) {
        cur -= 4;
        memcpy(out_tmp + cur, pre[x % mod], 4);
    }
    // Leading group of one to three digits; skip the table's zero padding.
    if(x >= 100) {
        cur -= 3;
        memcpy(out_tmp + cur, pre[x % mod] + 1, 3);
    } else if(x >= 10) {
        cur -= 2;
        memcpy(out_tmp + cur, pre[x % mod] + 2, 2);
    } else if(x >= 1) {
        cur -= 1;
        memcpy(out_tmp + cur, pre[x % mod] + 3, 1);
    }
    write_range(out_tmp + cur, offset - cur);
}
// Helper whose destructor flushes the output buffer; the single instance
// below makes the remaining output get written when the program ends.
struct Dummy {
    ~Dummy() { flush(); }
};
Dummy dummy;
} // namespace fastio
using fastio::write;
#line 4 "template.hpp"
// #pragma GCC target("avx2")
// #pragma GCC optimize("O3")
// #pragma GCC optimize("unroll-loops")
#line 8 "template.hpp"
using namespace std;
#ifdef LOCAL
#include <debug.hpp>
#else
#define debug(...)
#endif
// Writes a single streamable value through the fastio writer.
template <Streamable T> void print_one(const T &value) {
    fastio::write(value);
}
// Writes a modint-like value as the number returned by its val().
template <is_modint T> void print_one(const T &value) {
    const auto raw = value.val();
    print_one(raw);
}
// Ends the current output line.
void print() { print_one('\n'); }
// Prints all arguments on one line, separated by single spaces.
template <class T, class... Ts> void print(const T &a, const Ts &...b) {
    print_one(a);
    const auto emit_spaced = [](const auto &item) {
        print_one(' ');
        print_one(item);
    };
    (emit_spaced(b), ...);
    print();
}
// Prints the elements of a non-streamable range on one line, separated by
// single spaces.
template <ranges::range Iterable>
    requires(!Streamable<Iterable>)
void print(const Iterable &v) {
    bool first = true;
    for(auto it = v.begin(); it != v.end(); ++it) {
        if(!first)
            print_one(' ');
        first = false;
        print_one(*it);
    }
    print();
}
// Expands to the iterator pair begin(v), end(v) so a whole container can be
// handed to an iterator-based algorithm; note that v is evaluated twice.
#define all(v) begin(v), end(v)
// Sorts v in ascending order and erases duplicate elements in place.
template <class T> void UNIQUE(T &v) {
    ranges::sort(v);
    const auto new_end = unique(begin(v), end(v));
    v.erase(new_end, end(v));
}
// Raises a to b when b is strictly greater; returns whether a was changed.
template <typename T> inline bool chmax(T &a, T b) {
    if(a < b) {
        a = b;
        return true;
    }
    return false;
}
// Lowers a to b when b is strictly smaller; returns whether a was changed.
template <typename T> inline bool chmin(T &a, T b) {
    if(a > b) {
        a = b;
        return true;
    }
    return false;
}
// https://trap.jp/post/1224/
template <class... T> constexpr auto min(T... a) {
    return min(initializer_list<common_type_t<T...>>{a...});
}
template <class... T> constexpr auto max(T... a) {
    return max(initializer_list<common_type_t<T...>>{a...});
}
// Reading no values is a no-op.
void input() {}
// Declared ahead of the variadic overload so that its calls can resolve to the
// vector version: unqualified lookup only sees earlier declarations, and
// argument-dependent lookup for std::vector does not search this namespace.
template <class T> void input(vector<T> &a);
// Reads the arguments in order. A single argument is read directly (cin under
// LOCAL, fastio otherwise); several arguments are read one at a time, so a
// vector may appear at any position in the list.
template <class Head, class... Tail> void input(Head &head, Tail &...tail) {
    if constexpr(sizeof...(Tail) == 0) {
#ifdef LOCAL
        cin >> head;
#else
        fastio::read(head);
#endif
    } else {
        input(head);
        input(tail...);
    }
}
// Reads a.size() elements into an already sized vector.
template <class T> void input(vector<T> &a) {
    for(T &x : a)
        input(x);
}
// Declares the listed int variables and reads them with input(), in order.
// Expands to two statements, so it must not be the unbraced body of an
// if/for/while.
#define INT(...)                                                               \
    int __VA_ARGS__;                                                           \
    input(__VA_ARGS__)
// Same as INT, for long long variables.
#define LL(...)                                                                \
    long long __VA_ARGS__;                                                     \
    input(__VA_ARGS__)
// Same as INT, for string variables.
#define STR(...)                                                               \
    string __VA_ARGS__;                                                        \
    input(__VA_ARGS__)
// Building blocks of rep(...). REP1_0 adds one level of expansion so that
// __COUNTER__ is replaced by its number before REP1_1 pastes it with ##.
#define REP1_0(n, c) REP1_1(n, c)
// Repeats the following statement n times using a hidden, uniquely named
// counter.
#define REP1_1(n, c)                                                           \
    for(ll REP_COUNTER_##c = 0; REP_COUNTER_##c < (ll)(n); REP_COUNTER_##c++)
#define REP1(n) REP1_0(n, __COUNTER__)
// i runs over 0, 1, ..., a - 1.
#define REP2(i, a) for(ll i = 0; i < (ll)(a); i++)
// i runs over a, a + 1, ..., b - 1.
#define REP3(i, a, b) for(ll i = (ll)(a); i < (ll)(b); i++)
// i runs over a, a + c, a + 2c, ... while i < b.
#define REP4(i, a, b, c) for(ll i = (ll)(a); i < (ll)(b); i += (ll)(c))
// Selects its fifth argument; rep uses this to dispatch on argument count.
#define overload4(a, b, c, d, e, ...) e
// rep(n), rep(i, a), rep(i, a, b) or rep(i, a, b, c); the loop variable is ll.
#define rep(...) overload4(__VA_ARGS__, REP4, REP3, REP2, REP1)(__VA_ARGS__)
// Large sentinel value, 3 * 10^18.
ll inf = 3'000'000'000'000'000'000LL;
// Paired offsets (dx[i], dy[i]): (1, 0), (-1, 0), (0, 1), (0, -1).
vl dx{1, -1, 0, 0};
vl dy{0, 0, 1, -1};
// Integer division of x by y rounded toward negative infinity.
template <class T> constexpr T floor(T x, T y) noexcept {
    const T quotient = x / y;
    // Truncating division rounds toward zero, which is already the floor
    // unless the operands have opposite signs and the division is inexact.
    const bool opposite_signs = (x ^ y) < 0;
    if(opposite_signs and x % y != 0)
        return quotient - 1;
    return quotient;
}
// Integer division of x by y rounded toward positive infinity.
template <class T> constexpr T ceil(T x, T y) noexcept {
    const T quotient = x / y;
    // Truncating division rounds toward zero, which is already the ceiling
    // unless the operands have the same sign and the division is inexact.
    const bool same_sign = (x ^ y) >= 0;
    if(same_sign and x % y != 0)
        return quotient + 1;
    return quotient;
}
// Remainder of x modulo y, defined to be non-negative whatever the sign of y
// (the name follows the TeX command \bmod).
template <class T> constexpr T bmod(T x, T y) noexcept {
    const T rem = x % y;
    if(rem >= 0)
        return rem;
    // A negative remainder is shifted up by |y|.
    const T magnitude = (y > 0) ? y : -y;
    return rem + magnitude;
}
// std::bit_width for signed arguments: the value is converted to uint64_t
// first, so the result is computed on that 64-bit unsigned representation.
template <std::signed_integral T> constexpr int bit_width(T x) noexcept {
    const auto as_unsigned = static_cast<uint64_t>(x);
    return std::bit_width(as_unsigned);
}
// std::popcount for signed arguments: the value is converted to uint64_t
// first, so set bits are counted in that 64-bit unsigned representation.
template <std::signed_integral T> constexpr int popcount(T x) noexcept {
    const auto as_unsigned = static_cast<uint64_t>(x);
    return std::popcount(as_unsigned);
}
// True when bit k of n is set (k = 0 is the least significant bit).
constexpr bool kth_bit(auto n, auto k) {
    const auto shifted = n >> k;
    return (shifted & 1) != 0;
}
#line 3 "poly/formal-power-series.hpp"
#include <atcoder/convolution>
// 10^9+7みたいなときconvolutionどうする？
/// Truncated formal power series over the coefficient type mint, stored as a
/// vector whose element i is the coefficient of x^i. Products are computed
/// with atcoder::convolution (atcoder::convolution_ll when mint is long long).
template <class mint> struct FormalPowerSeries : vector<mint> {
    using vector<mint>::vector;
    using FPS = FormalPowerSeries;
    /// Implicit conversion from a plain coefficient vector (copies v).
    FormalPowerSeries(const vector<mint> &v) : vector<mint>(v) {}
    /// Coefficient-wise addition; grows to f's length when f is longer.
    FPS &operator+=(const FPS &f) {
        if(this->size() < f.size())
            this->resize(f.size());
        for(int i = 0; i < ssize(f); ++i)
            (*this)[i] += f[i];
        return *this;
    }
    /// Coefficient-wise subtraction; grows to f's length when f is longer.
    FPS &operator-=(const FPS &f) {
        if(this->size() < f.size())
            this->resize(f.size());
        for(int i = 0; i < ssize(f); ++i)
            (*this)[i] -= f[i];
        return *this;
    }
    /// Untruncated product with f.
    FPS &operator*=(const FPS &f) {
        if constexpr(is_same_v<mint, long long>) {
            return (*this) = atcoder::convolution_ll(*this, f);
        } else {
            return (*this) = atcoder::convolution(*this, f);
        }
    }
    /// Multiplies every coefficient by the scalar x.
    FPS &operator*=(const mint &x) {
        for(mint &vi : *this)
            vi *= x;
        return *this;
    }
    FPS operator+(const FPS &f) const { return FPS(*this) += f; }
    FPS operator-(const FPS &f) const { return FPS(*this) -= f; }
    FPS operator*(const FPS &f) const { return FPS(*this) *= f; }
    FPS operator*(const mint &x) const { return FPS(*this) *= x; }
    /// Negates every coefficient.
    FPS operator-() const {
        FPS res = *this;
        for(mint &vi : res) {
            vi = -vi;
        }
        return res;
    }
    /// Drops the lowest sz coefficients (division by x^sz, remainder
    /// discarded); returns an empty series when sz >= size().
    FPS operator>>(const int sz) const {
        if(sz >= ssize(*this))
            return {};
        FPS res(begin(*this) + sz, end(*this));
        return res;
    }
    /// Prepends sz zero coefficients (multiplication by x^sz).
    FPS operator<<(const int sz) const {
        FPS res(sz, 0);
        res.insert(end(res), begin(*this), end(*this));
        return res;
    }
    /// Multiplicative inverse truncated to deg coefficients (deg == -1 means
    /// size()). Requires a non-empty series with a nonzero constant term.
    /// NOTE: for deg == 0 the loop never runs and the one-element seed is
    /// returned as is.
    FPS inv(int deg = -1) const {
        assert(!this->empty() and (*this)[0] != mint(0));
        if(deg == -1)
            deg = this->size();
        FPS res = {(*this)[0].inv()};
        FPS f;
        f.reserve(this->size());
        // Newton iteration res <- res * (2 - f * res); f is the prefix of
        // *this of length min(size(), d) and res is cut to min(d, deg).
        for(int d = 1; d < deg << 1; d <<= 1) {
            while(ssize(f) < min(ssize(*this), d))
                f.emplace_back((*this)[f.size()]);
            res *= (FPS({2}) - f * res);
            while(ssize(res) > min(d, deg))
                res.pop_back();
        }
        return res;
    }
    /// Square root truncated to deg coefficients (deg == -1 means size()).
    /// Returns an empty series when no square root exists.
    /// Pass get_sqrt when the constant term is not 1; it must return a square
    /// root of that constant term. Note that several solutions may exist.
    FPS sqrt(
        int deg = -1,
        function<mint(mint)> get_sqrt = [](mint) { return mint(1); }) const {
        if(this->empty())
            return {};
        if(deg == -1)
            deg = this->size();
        if((*this)[0] == mint(0)) {
            // Factor out x^i, where i is the index of the first nonzero
            // coefficient; a square root needs i to be even.
            for(int i = 1; i < ssize(*this); ++i) {
                if((*this)[i] == mint(0))
                    continue;
                if(i & 1)
                    return {};
                if(i / 2 >= deg)
                    break;
                FPS res = (*this >> i).sqrt(deg - i / 2, get_sqrt);
                if(res.empty())
                    return {};
                res = res << (i / 2);
                return res;
            }
            return FPS(deg, 0);
        }
        FPS res{get_sqrt((*this)[0])};
        // Reject a get_sqrt result that does not square to the constant term.
        if(res[0] * res[0] != (*this)[0])
            return {};
        FPS f;
        f.reserve(this->size());
        mint inv2 = mint(1) / mint(2);
        // Newton iteration res <- (res + f / res) / 2.
        for(int d = 1; d < deg << 1; d <<= 1) {
            while(ssize(f) < min(ssize(*this), d))
                f.emplace_back((*this)[f.size()]);
            res = (res + f * res.inv(d)) * inv2;
            while(ssize(res) > min(d, deg))
                res.pop_back();
        }
        return res;
    }
    /// Formal derivative; the result is one coefficient shorter (empty stays
    /// empty).
    FPS diff() const {
        FPS res(max<int>(0, ssize(*this) - 1));
        for(int i = 1; i < ssize(*this); ++i)
            res[i - 1] = (mint)i * (*this)[i];
        return res;
    }
    /// Formal integral with constant term 0; the result is one coefficient
    /// longer.
    FPS integral() const {
        FPS res(ssize(*this) + 1);
        for(int i = 0; i < ssize(*this); ++i)
            res[i + 1] = (*this)[i] / mint(i + 1);
        return res;
    }
    /// Logarithm truncated to deg coefficients (deg == -1 means size()),
    /// computed as the integral of f' / f. Requires a non-empty series whose
    /// constant term is 1.
    FPS log(int deg = -1) const {
        assert(!this->empty() and (*this)[0] == (mint)1);
        if(deg == -1)
            deg = this->size();
        if(deg == 0)
            return {};
        FPS t(begin(*this), begin(*this) + min<int>(deg, ssize(*this)));
        FPS res = t.diff() * t.inv(deg - 1);
        res.resize(deg - 1);
        return res.integral();
    }
    /// Exponential truncated to deg coefficients (deg == -1 means size()).
    /// Requires a non-empty series whose constant term is 0. Does not modify
    /// *this, so it is const like the other analytic operations.
    FPS exp(int deg = -1) const {
        assert(!this->empty() and (*this)[0] == (mint)0);
        if(deg == -1)
            deg = this->size();
        if(deg == 0)
            return {};
        FPS res = {1};
        FPS f;
        f.reserve(this->size());
        // Newton iteration res <- res * (1 + f - log(res)).
        for(int d = 1; d < deg << 1; d <<= 1) {
            while(ssize(f) < min(ssize(*this), d))
                f.emplace_back((*this)[f.size()]);
            res *= (FPS({1}) + f - res.log(d));
            while(ssize(res) > min(d, deg))
                res.pop_back();
        }
        return res;
    }
};
#line 3 "poly/sum-of-powers.hpp"
/**
 * @brief 冪乗和の列挙
 * @see https://yukicoder.me/problems/no/1145/editorial
 * @see https://maspypy.com/多項式・形式的べき級数-高速に計算できるもの#toc19
 * @see https://maspypy.com/多項式・形式的べき級数-高速に計算できるもの#toc34
 */
/// For each i (0 <= i <= k) computes the sum over j of a_j^i and returns the
/// k + 1 values as a sequence indexed by i.
/// O(n*log(n)^2 + k*log(k)) time.
template <class mint> vector<mint> sum_of_powers(const vector<mint> &a, int k) {
    if(a.empty())
        return vector<mint>(k + 1, 0);
    // Multiply the linear factors (1 - a_j x) pairwise through a queue.
    queue<FormalPowerSeries<mint>> que;
    for(auto &ai : a)
        que.push({1, -ai});
    while(que.size() > 1) {
        // Move the operands out: they are popped right away, so copying the
        // coefficient vectors would be pure overhead.
        auto f = std::move(que.front());
        que.pop();
        auto g = std::move(que.front());
        que.pop();
        que.push(f * g);
    }
    // Coefficient i of the logarithm of the product is -(1/i) * sum_j a_j^i.
    auto f = que.front().log(k + 1);
    for(int i = 1; i <= k; ++i)
        f[i] = -f[i] * mint(i);
    // The 0-th power sum is the number of elements.
    f[0] = ssize(a);
    return f;
}
/// For each i (0 <= i <= k) computes the sum of j^i over the integers j in
/// [0, n), i.e. j = 0, 1, ..., n - 1, and returns the k + 1 values as a
/// sequence indexed by i. 0^0 counts as 1, so entry 0 equals n.
/// (For example n = 1, k = 1 yields {1, 0}.)
/// O(k*log(k)) time.
template <class mint> vector<mint> sum_of_powers_iota(int n, int k) {
    using FPS = FormalPowerSeries<mint>;
    // Build num[i] = n^(i+1) / (i+1)! and den[i] = 1 / (i+1)!, which are the
    // series of (e^(n x) - 1) / x and (e^x - 1) / x.
    FPS num(k + 1, 1), den(k + 1, 1);
    mint fac = 1, npow = n;
    for(int i = 0; i <= k; ++i, npow *= n) {
        num[i] *= npow;
        fac *= i + 1;
    }
    // fac is (k+1)! here; invert once and walk down to get every 1 / (i+1)!.
    fac = mint(1) / fac;
    for(int i = k; i >= 0; --i) {
        num[i] *= fac;
        den[i] *= fac;
        fac *= i + 1;
    }
    // The quotient is sum_{j=0}^{n-1} e^(j x), whose x^i coefficient is the
    // wanted power sum divided by i!.
    FPS res = num * den.inv(k + 1);
    res.resize(k + 1);
    fac = 1;
    for(int i = 0; i <= k; ++i) {
        res[i] *= fac;
        fac *= i + 1;
    }
    return res;
}
#line 4 "test/yukicoder/1145.test.cpp"
#include <atcoder/modint>
using mint = atcoder::modint998244353;
void solve() {
    INT(n, m);
    vector<mint> a(n);
    rep(i, n) {
        INT(ai);
        a[i] = ai;
    }
    auto f = sum_of_powers(a, m);
    rep(i, 1, m + 1) cout << f[i].val() << " \n"[i == m];
}
/// Entry point: turns off C stdio synchronisation, unties cin from cout,
/// and runs the single test case.
int main() {
    ios::sync_with_stdio(false);
    cin.tie(nullptr);
    solve();
    return 0;
}

Test cases

Env	Name	Status	Elapsed	Memory
g++	00	AC	5 ms	4 MB
g++	01	AC	4 ms	4 MB
g++	10	AC	5 ms	4 MB
g++	11	AC	192 ms	11 MB
g++	12	AC	193 ms	12 MB
g++	13	AC	193 ms	11 MB