You are given $n$ arrays that can have different sizes. You also have a table with $w$ columns and $n$ rows. The $i$-th array is placed horizontally in the $i$-th row. You can slide each array within its row as long as it occupies several consecutive cells and lies completely inside the table.
You need to find the maximum sum of the integers in the $j$-th column for each $j$ from $1$ to $w$ independently.
Optimal placements for columns $1$, $2$ and $3$ are shown on the pictures from left to right.
Note that you can exclude any array out of a column provided it remains in the window. In this case its value is considered to be zero.
Input
The first line contains two integers $n$ ($1 \le n \le 10^{6}$) and $w$ ($1 \le w \le 10^{6}$) — the number of arrays and the width of the table.
Each of the next $n$ lines consists of an integer $l_{i}$ ($1 \le l_{i} \le w$), the length of the $i$-th array, followed by $l_{i}$ integers $a_{i1}, a_{i2}, \ldots, a_{il_i}$ ($-10^{9} \le a_{ij} \le 10^{9}$) — the elements of the array.
The total length of the arrays does no exceed $10^{6}$.
Output
Print $w$ integers, the $i$-th of them should be the maximum sum for column $i$.
Examples
input
3 3 3 2 4 8 2 2 5 2 6 3
output
10 15 16
input
2 2 2 7 8 1 -8
output
7 8
Note
Illustration for the first example is in the statement.
Solution:
#include <bits/stdc++.h> using namespace std; template <typename T, class F = function<T(const T&, const T&)>> class SparseTable { public: int n; vector<vector<T>> mat; F func; SparseTable(const vector<T>& a, const F& f) : func(f) { n = static_cast<int>(a.size()); int max_log = 32 - __builtin_clz(n); mat.resize(max_log); mat[0] = a; for (int j = 1; j < max_log; j++) { mat[j].resize(n - (1 << j) + 1); for (int i = 0; i <= n - (1 << j); i++) { mat[j][i] = func(mat[j - 1][i], mat[j - 1][i + (1 << (j - 1))]); } } } T get(int from, int to) const { assert(0 <= from && from <= to && to <= n - 1); int lg = 32 - __builtin_clz(to - from + 1) - 1; return func(mat[lg][from], mat[lg][to - (1 << lg) + 1]); } }; int main() { ios::sync_with_stdio(false); cin.tie(0); int cnt, w; cin >> cnt >> w; vector<long long> res(w + 1); while (cnt--) { int n; cin >> n; vector<int> a(n); for (int i = 0; i < n; i++) { cin >> a[i]; } SparseTable<int> st(a, [&](int i, int j) { return max(i, j); }); for (int i = 0; i < w; i++) { int from = max(i - (w - n), 0); int to = min(i, n - 1); int cur = st.get(from, to); if (cur < 0 && (i >= n || i < w - n)) { cur = 0; } res[i] += cur; if (from == 0 && to == n - 1 && i >= n && w >= 2 * n + 1) { i = max(i, w - n - 1); } res[i + 1] -= cur; } } for (int i = 0; i < w; i++) { if (i > 0) { cout << " "; } cout << res[i]; res[i + 1] += res[i]; } cout << '\n'; return 0; }