Codeforces 1781C. Equal Frequencies

历史记录

清除记录

猜你想搜

AcWing热点
App
登录/注册

Codeforces 1781C. Equal Frequencies 原题链接中等

作者：

pein531 , 2024-01-10 23:06:52 , 所有人可见 , 阅读 65

题目描述

难度分: $1600$

输入 $T(\leq 10^4)$ 表示 $T$ 组数据。所有数据的 $n$ 之和 $\leq 10^5$ 。

每组数据输入 $n(1 \leq n \leq 10^5)$ 和长为 $n$ 的字符串 $s$ ，仅包含小写英文字母。

如果一个字符串中的每个字母的出现次数都相同，我们就称该字符串为平衡字符串。

每次操作，你可以修改一个 $s[i]$ 。

你需要把 $s$ 变成平衡字符串。

输出最少要操作多少次，以及修改后的字符串。如果有多个符合要求的字符串，输出任意一个。

输入样例

4
5
hello
10
codeforces
5
eevee
6
appall

输出样例

1
helno
2
codefofced
1
eeeee
0
appall

算法

枚举+构造

这个题实在不难，但是实现起来感觉特别难受，花了很长时间写了如下冗长的代码，今天实在是优化不动了。

思路很简单，由于 $s$ 串中最多可能有 $26$ 种字母，并且字母种数 $t$ 必须还要能整除 $n$ 才能保证每种字母的频数都相等，因此我们可以枚举这些情况。先枚举出所有可能的字母频数，存入 $cands$ 数组中。

对于 $cands$ 中的每个目标频数 $target$ ，都计算最小操作数。对于目标频数 $target$ ，一共有 $t=\frac{n}{target}$ 种字母，设 $s$ 中原本的字母种数为 $sz$ ，分为以下两种情况：

1. $sz \leq t$ ，这时候 $s$ 串中原本存在的字母全部保留；若 $sz \lt t$ ，还需要添加 $s$ 串中原本不存在的字母：先遍历一遍 $s$ 得到串中原本存在的字母，然后再随便选 $t-sz$ 种 $s$ 串中不存在的字母，每种字母的频数都应该是 $target$ 。
2. $sz \gt t$ ，这时候不需要添加额外的字母，只需要用 $s$ 串中原本的字母即可。对于某个字母种数 $t$ ，要想操作数达到最小，只需要让 $s$ 只保留 $t$ 种频数大小相邻的字母。预处理得到一个二元组“（字母频数，字母）”数组 $tup$ ，将它按照字母频数排序，用一个长度为 $t$ 的窗口滑动计算每个窗口的最小操作次数即可。

对于以上每种情况，将 $t$ 种字母的频数存入到哈希表 $need$ 中，根据 $need$ 构造答案就行，构造方法详见代码中的 $construct$ 函数。

复杂度分析

时间复杂度

对于情况 $2$ ，每种目标频数 $target$ 都需要对 $tup$ 数组进行排序，情况 $1$ 不需要。但由于 $tup$ 最长就是 $26$ ，所以排序的复杂度可以看成是个很大的常数（准确应该是 $O(\Sigma \log_2 \Sigma)$ ， $\Sigma$ 是字符集的大小）。

预处理出以上需要的各个哈希表瓶颈在于遍历 $s$ 串，时间复杂度为 $O(n)$ ；而计算出每个目标频数 $target$ 的最小操作次数只需要遍历这些哈希表，可以看成是常数。构造出一个答案只需要遍历有限几次 $s$ 串，时间复杂度也大约是 $O(n)$ 的。综上，整个算法的时间复杂度近似为 $O(n)$ 。

空间复杂度

算法过程中的哈希表都是字符集大小的空间消耗，本题中字符集大小在最差情况下为 $26$ 。而构造出一个答案在 $construct$ 函数中使用了队列来存索引，在最差情况下会消耗 $O(n)$ 级别的空间。因此，算法整体的额外空间复杂度为 $O(n+\Sigma)$ （其中 $\Sigma$ 是字符集的大小）。

C++ 代码

#include <algorithm>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <iostream>
#include <queue>
#include <unordered_map>
#include <vector>

using namespace std;

// Buffer size: the stated limit n <= 1e5 plus slack for 1-based indexing and
// the terminating NUL.
const int N = 100010;
// t: number of test cases, n: length of the current string.
int t, n;
// s: current input string, ans: best rebuilt string found so far.
// Both are used 1-indexed (characters live in [1..n]).
char s[N], ans[N];
// counter: number of occurrences of every letter present in s.
// extra:   letters of 'a'..'z' that do not occur in s (mapped value is always 0).
unordered_map<char, int> counter, extra;

/**
 * Fills ans[1..n] with a rewrite of s[1..n] in which each letter c listed in
 * `need` occurs need[c] times.
 *
 * Every occurrence in s that still fits into its letter's quota is kept in
 * place; all other positions are collected in order and then overwritten with
 * the letters whose quota is not yet exhausted. The terminating NUL is NOT
 * written here.
 *
 * @param need   Letter -> number of occurrences wanted in the result. Callers
 *               pass `target` for every entry, and the quotas are expected to
 *               sum to n. The map is consumed: entries are decremented and
 *               erased as quotas fill up.
 * @param target Per-letter frequency; kept for signature compatibility. The
 *               quotas stored in `need` are authoritative.
 * @param flag   Kept for signature compatibility. It used to select a variant
 *               that assumed every letter of s is present in `need`; that
 *               variant kept unrequested letters and inserted negative
 *               entries into `need` when the assumption did not hold. The
 *               single code path below handles both cases.
 */
void construct(unordered_map<char, int>& need, int target, bool flag) {
    (void)target;
    (void)flag;

    // Positions whose original character cannot stay, in increasing order.
    queue<int> q;
    for (int i = 1; i <= n; i++) {
        auto slot = need.find(s[i]);
        if (slot == need.end() || slot->second <= 0) {
            // Letter is not wanted at all, or its quota is already full.
            q.push(i);
            continue;
        }
        ans[i] = s[i];
        if (--slot->second == 0) {
            // Quota reached: drop the letter so later occurrences get replaced
            // and the fill phase below only sees letters that still lack copies.
            need.erase(slot);
        }
    }

    // Hand the freed positions to the letters that are still short.
    auto it = need.begin();
    while (!q.empty()) {
        const int i = q.front();
        q.pop();
        while (it != need.end() && it->second <= 0) {
            ++it;
        }
        if (it == need.end()) {
            // Only reachable when the quotas sum to less than n: keep the
            // original character instead of leaving stale data in ans.
            ans[i] = s[i];
            continue;
        }
        ans[i] = it->first;
        --it->second;
    }
}

/**
 * Reads the test cases from stdin. For each one it prints the minimum number
 * of character replacements after which every letter of the string occurs
 * equally often, followed by one string that achieves it.
 *
 * Every per-letter frequency `target` that splits n into at most 26 letters
 * is tried. For each, the cheapest set of letters is costed, and whenever
 * that cost beats the best seen so far construct() rebuilds `ans` for it.
 */
int main() {
    if (scanf("%d", &t) != 1) {
        return 0;
    }
    for (int index = 1; index <= t; index++) {
        // Stop on truncated or inconsistent input instead of working on stale
        // buffers. NOTE(review): "%s" itself is unbounded; the input is
        // trusted to respect the stated length limit.
        if (scanf("%d", &n) != 1 || scanf("%s", s + 1) != 1) {
            break;
        }
        if (n < 1 || n > static_cast<int>(sizeof(s)) - 2 ||
            strlen(s + 1) != static_cast<size_t>(n)) {
            break;
        }

        // Occurrences of every letter present in s.
        counter.clear();
        extra.clear();
        for (int i = 1; i <= n; i++) {
            counter[s[i]]++;
        }

        // Possible per-letter frequencies: divisors of n that leave at most
        // 26 distinct letters.
        vector<int> cands;
        for (int freq = 1; freq <= n; freq++) {
            if (n % freq == 0 && n / freq <= 26) {
                cands.push_back(freq);
            }
        }

        // Letters that do not occur in s; used when more kinds are required.
        for (char c = 'a'; c <= 'z'; c++) {
            if (counter.find(c) == counter.end()) {
                extra[c] = 0;
            }
        }

        const int sz = static_cast<int>(counter.size());
        int min_op = 0x3f3f3f3f;
        for (int target : cands) {
            // Number of distinct letters the final string must contain.
            const int kinds = n / target;
            if (sz <= kinds) {
                // Too few letters (or exactly enough): keep every present
                // letter and add (kinds - sz) absent ones. Summing
                // |count - target| counts each replacement twice (once where a
                // letter is removed, once where one is added), hence the halving.
                int res = target * (kinds - sz);
                for (const auto& entry : counter) {
                    res += abs(entry.second - target);
                }
                res >>= 1;
                if (res < min_op) {
                    min_op = res;
                    unordered_map<char, int> need;
                    for (const auto& entry : counter) {
                        need[entry.first] = target;
                    }
                    int missing = kinds - sz;
                    for (auto it = extra.begin(); missing > 0 && it != extra.end(); ++it, --missing) {
                        need[it->first] = target;
                    }
                    construct(need, target, true);
                }
            } else {
                // Too many letters: keep `kinds` of them. Candidates are the
                // cyclic windows of length `kinds` over the letters sorted by
                // frequency; the window of the most frequent letters
                // (start = sz - kinds) is among them.
                vector<pair<int, char>> tup;
                for (const auto& entry : counter) {
                    tup.push_back({entry.second, entry.first});
                }
                sort(tup.begin(), tup.end());

                int best_start = -1;
                for (int l = 0; l < sz; l++) {
                    int tot = 0;
                    int res = 0;
                    for (int k = 0; k < kinds; k++) {
                        const int cnt = tup[(l + k) % sz].first;
                        tot += cnt;
                        res += abs(cnt - target);
                    }
                    // Every character of a discarded letter must be replaced.
                    res += n - tot;
                    res >>= 1;
                    if (res < min_op) {
                        min_op = res;
                        best_start = l;
                    }
                }
                if (best_start >= 0) {
                    unordered_map<char, int> need;
                    for (int k = 0; k < kinds; k++) {
                        need[tup[(best_start + k) % sz].second] = target;
                    }
                    construct(need, target, false);
                }
            }
        }

        printf("%d\n", min_op);
        ans[n + 1] = '\0';
        puts(ans + 1);
    }
    return 0;
}