// This submission was migrated from a previous version of oj.uz, which used a different machine for grading. It may produce a different result if resubmitted.
#include <bits/stdc++.h>
using namespace std;
/// A line y = a*x + b together with a caller-chosen tag.
struct Line
{
    long a;  // slope
    long b;  // intercept
    int idx; // tag handed back by CHT::query; the hull never interprets it
};

/// x-coordinate at which v1 and v2 take the same value, i.e.
/// (v2.b - v1.b) / (v1.a - v2.a).
/// Precondition: the slopes differ (equal slopes divide by zero).
__float128 isect(Line v1, Line v2)
{
    // Widen before subtracting so neither difference can overflow `long`.
    const __float128 num = static_cast<__float128>(v2.b) - v1.b;
    const __float128 den = static_cast<__float128>(v1.a) - v2.a;
    return num / den;
}

/// Value of line v at x.
long eval(Line v, long x)
{
    return v.a * x + v.b;
}

/// Upper envelope (maximum) of a set of lines, for the monotone case:
/// lines arrive with non-decreasing slope and queries with non-decreasing x.
/// The stored slopes are kept strictly increasing, so isect() is never
/// called on two lines with the same slope.
struct CHT
{
    std::deque<Line> lines;

    /// Inserts the line a*x + b. The slope must be >= every slope inserted so far.
    void push_line(Line l)
    {
        if (!lines.empty() && lines.back().a == l.a)
        {
            // Parallel lines: only the higher one can ever be the maximum.
            if (lines.back().b >= l.b)
                return;
            // The stored line is dominated everywhere; drop it so the hull
            // never holds two lines with the same slope.
            lines.pop_back();
        }
        // Drop the last line while the new one overtakes it no later than it
        // overtakes its own predecessor (it is then never the maximum).
        while (lines.size() >= 2 &&
               isect(lines.back(), lines[lines.size() - 2]) >= isect(lines.back(), l))
            lines.pop_back();
        lines.push_back(l);
    }

    /// Returns {max over stored lines of a*x + b, idx of the line attaining it}.
    /// x must be >= every x queried so far; lines that stop being optimal are
    /// discarded from the front. Precondition: at least one line was inserted.
    std::pair<long, int> query(long x)
    {
        assert(!lines.empty());
        // On ties the later line wins, so the front can be dropped on <=.
        while (lines.size() >= 2 && eval(lines[0], x) <= eval(lines[1], x))
            lines.pop_front();
        const Line &best = lines.front();
        return {eval(best, x), best.idx};
    }
};
/// Picks K cut positions in A and returns {best total, positions in ascending order}.
///
/// With prefix sums S, a cut at position i (between A[i-1] and A[i]) that
/// follows a cut at j < i (j = 0 meaning "no earlier cut") contributes
///     (S[i] - S[j]) * (S[N] - S[i]),
/// and the total is the sum of these contributions over the chosen cuts.
/// NOTE(review): this looks like the classic "split the sequence" task — confirm.
///
/// Reported positions are distinct and lie in 1..N-1. If K exceeds the N-1
/// available positions, only N-1 cuts are placed and the surplus entries at
/// the front of the list are left as 0.
///
/// Assumes the elements of A are non-negative: the hull needs non-decreasing
/// slopes (S[N] + S[j]) and non-decreasing query points (S[i]).
std::pair<long, std::vector<int>> solve(std::vector<long> A, int K)
{
    const int N = static_cast<int>(A.size());

    std::vector<long> S(N + 1);
    for (int i = 0; i < N; ++i)
        S[i + 1] = S[i] + A[i];
    const long total = S[N];

    // Number of cuts that can actually be placed on distinct interior positions.
    const int cuts = std::max(0, std::min(K, N - 1));

    std::vector<long> pD(N + 1); // previous layer: best total with k-1 cuts, last at index
    std::vector<std::vector<int>> bktk(cuts + 1, std::vector<int>(N + 1));
    for (int k = 1; k <= cuts; ++k)
    {
        CHT cht;
        std::vector<long> D(N + 1);
        // The k-th cut needs k-1 distinct cuts before it, so it sits at i >= k,
        // and its predecessor j ranges over k-1 .. i-1. Feeding j = i-1 right
        // before querying i keeps exactly those candidates in the hull.
        for (int i = k; i < N; ++i)
        {
            const int j = i - 1;
            // pD[j] + (S[i]-S[j])*(total-S[i]) expanded as a line in x = S[i];
            // the -S[i]^2 + ... part independent of j is added after the query.
            cht.push_line({total + S[j], pD[j] - S[j] * total, j});
            const auto [v, q] = cht.query(S[i]);
            bktk[k][i] = q;
            D[i] = v - S[i] * S[i];
        }
        pD = std::move(D);
    }

    std::vector<int> ret(K);
    long ans = 0;
    if (cuts > 0)
    {
        // Best admissible position for the last cut (first maximum wins).
        int cur = cuts;
        for (int i = cuts + 1; i < N; ++i)
            if (pD[i] > pD[cur])
                cur = i;
        ans = pD[cur];
        // Walk the predecessor links back; positions strictly decrease, so
        // filling from the back yields an ascending list.
        for (int k = cuts; k >= 1; --k)
        {
            ret[K - cuts + k - 1] = cur;
            cur = bktk[k][cur];
        }
    }
    return {ans, ret};
}
/// Reads "N K" and then N values from standard input, runs solve(), and
/// prints the best total on the first line and the chosen positions,
/// each followed by a space, on the second.
/// Exits with status 1 if the input is malformed or a size is negative.
int main()
{
    // Only iostream is used here, so C stdio synchronisation is not needed.
    std::ios_base::sync_with_stdio(false);
    std::cin.tie(nullptr);

    int N, K;
    if (!(std::cin >> N >> K) || N < 0 || K < 0)
        return 1;

    std::vector<long> A(N);
    for (auto &x : A)
        if (!(std::cin >> x))
            return 1;

    const auto [ans, res] = solve(A, K);
    // '\n' instead of endl: same bytes, no forced flush per line.
    std::cout << ans << '\n';
    for (int x : res)
        std::cout << x << " ";
    std::cout << '\n';
    return 0;
}
/*
| # | Verdict | Execution time | Memory | Grader output |
|---|
| Fetching results... |
| # | Verdict | Execution time | Memory | Grader output |
|---|
| Fetching results... |
| # | Verdict | Execution time | Memory | Grader output |
|---|
| Fetching results... |
| # | Verdict | Execution time | Memory | Grader output |
|---|
| Fetching results... |
| # | Verdict | Execution time | Memory | Grader output |
|---|
| Fetching results... |
| # | Verdict | Execution time | Memory | Grader output |
|---|
| Fetching results... |
*/