1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129
| #include <cstdio> #include <vector> #include <algorithm> using namespace std; template <class Type> void read(Type &x) { char c; bool flag = false; while ((c = getchar()) < '0' || c > '9') c == '-' && (flag = true); x = c - '0'; while ((c = getchar()) >= '0' && c <= '9') x = (x << 3) + (x << 1) + c - '0'; if (flag) x = ~x + 1; } template <class Type, class ...rest> void read(Type &x, rest &...y) { read(x), read(y...); } template <class Type> void write(Type x) { if (x < 0) putchar('-'), x = ~x + 1; if (x > 9) write(x / 10); putchar(x % 10 + '0'); } typedef __int128 L; typedef long long LL; const int N = 1e5 + 10, p1 = 998244353, p2 = 1004535809, p3 = 469762049, p = 1e9 + 7; const L mul = (L)p1 * p2 * p3; int w[N]; template <const int &mod> struct NTT { int rev[N]; int binpow (int b, int k = mod - 2) { int res = 1; for (; k; k >>= 1, b = (LL)b * b % mod) if (k & 1) res = (LL)res * b % mod; return res; } void ntt (int *x, int bit, int op) { int tot = 1 << bit; for (int i = 0; i < tot; ++i) if ((rev[i] = rev[i >> 1] >> 1 | ((i & 1) << bit - 1)) > i) swap(x[rev[i]], x[i]); for (int mid = 1; mid < tot; mid <<= 1) { int w1 = binpow(3, (mod - 1) / (mid << 1)); if (!~op) w1 = binpow(w1); for (int i = 0; i < tot; i += mid << 1) for (int j = 0, k = 1; j < mid; ++j, k = (LL)k * w1 % mod) { int p = x[i | j], q = (LL)k * x[i | j | mid] % mod; x[i | j] = (p + q) % mod, x[i | mid | j] = (p - q) % mod; } } if (~op) return; int itot = binpow(tot); for (int i = 0; i < tot; ++i) x[i] = (LL)x[i] * itot % mod; } void PolyMul (int n, vector <int> &f, int m, vector <int> &g, int nm, vector <int> &w) { static int A[N], B[N], C[N]; for (int i = 0; i <= n; ++i) A[i] = f[i] % mod; for (int i = 0; i <= m; ++i) B[i] = g[i] % mod; int bit = 1; while (n + m + 1 > 1 << bit) ++bit; int tot = 1 << bit; for (int i = n + 1; i < tot; ++i) A[i] = 0; for (int i = m + 1; i < tot; ++i) B[i] = 0; ntt(A, bit, 1), ntt(B, bit, 1); for (int i = 0; i < tot; ++i) C[i] = (LL)A[i] * B[i] % mod; ntt(C, bit, -1); for (int i = 0; i <= nm; ++i) w[i] = C[i]; } }; NTT <p1> q1; NTT <p2> q2; NTT <p3> q3; int CRT (int x1, int x2, int x3) { L res = 0; res += (L)x1 * p2 * p3 * q1.binpow((LL)p2 * p3 % p1); res += (L)x2 * p1 * p3 * q2.binpow((LL)p1 * p3 % p2); res += (L)x3 * p1 * p2 * q3.binpow((LL)p1 * p2 % p3); res %= mul; if (res >= (L)p * p * N) res -= mul; if (res <= -(L)p * p * N) res += mul; return res % p; } void solve (int l, int r, int &k, vector <int> &g) { if (l == r) return g[0] = w[l], g[1] = -1, void(); int mid = l + r >> 1; int nm = min(k, r - l + 1), n = min(k, mid - l + 1), m = min(k, r - mid); vector <int> A, B, C, D, E; A.resize(n + 1); B.resize(m + 1); C.resize(nm + 1), D.resize(nm + 1), E.resize(nm + 1); solve(l, mid, k, A), solve(mid + 1, r, k, B); q1.PolyMul(n, A, m, B, nm, C); q2.PolyMul(n, A, m, B, nm, D); q3.PolyMul(n, A, m, B, nm, E); for (int i = 0; i <= nm; ++i) g[i] = CRT(C[i], D[i], E[i]); } int binpow (int b, int k = p - 2) { int res = 1; for (; k; k >>= 1, b = (LL)b * b % p) if (k & 1) res = (LL)res * b % p; return res; } int main () { int n, m; read(n, m); int tot = 1; for (int i = 1; i <= n; ++i) read(w[i]), tot = (LL)tot * w[i] % p; vector <int> A; A.resize(min(m, n) + 1); solve(1, n, m, A); int res = 0; for (int i = 0, t = 1; i <= min(n, m); t = (LL)t * (m - i++) % p) (res += (LL)binpow(n, m - i) * t % p * A[i] % p) %= p; write(((tot - (LL)res * binpow(binpow(n, m))) % p + p) % p); return 0; }
|