【算法基础】1.8离散化（区间和：离散化+前缀和）

Wei *

已于 2023-07-14 16:10:50 修改

阅读量381

点赞数 1

分类专栏：算法 文章标签：算法 c++ 离散化 前缀和 Java

于 2023-01-17 00:00:00 首次发布

本文链接：https://blog.csdn.net/qq_43406895/article/details/128686309

版权

算法专栏收录该内容

69 篇文章 5 订阅

订阅专栏

文章目录

离散化
- 如何离散
- 确定映射方式
例题——区间和⭐⭐⭐⭐⭐（离散化+前缀和）

当数据范围的跨度很大，但是数据很稀疏时，可以使用离散化。

离散化

如何离散

在这里插入图片描述

数据范围很大，但是并不是每个数字都会出现，就可以将原始数据按照顺序映射到一个小的数据范围。

确定映射方式

按照顺序，一对一的方式，比如：
原数据：1, 3, 7, 8, 12, 1000, 99999
就可以映射成：0，1，2，3，4，5，6
其中1->0, 3->1, 7->2, 8->3, 12->4, 1000->5, 99999->6。

如果原始数据有重复，需要排序去重。

如何确定一个数字排在哪个位置呢？可以使用二分。

例题——区间和⭐⭐⭐⭐⭐（离散化+前缀和）

假定有一个无限长的数轴，数轴上每个坐标上的数都是 0。

现在，我们首先进行 n 次操作，每次操作将某一位置 x 上的数加 c。

接下来，进行 m 次询问，每个询问包含两个整数 l 和 r，你需要求出在区间 [l,r] 之间的所有数的和。

在这里插入图片描述

思路

操作和询问的次数（n、m）不大，但是坐标的值域很大！——考虑离散化

Q：具体怎么离散化？
A：将各个下标映射到从 0 开始的有序下标。

Q：怎么确定有序下标的范围？
A：用列表存储所有出现的下标（包括每次加操作的位置 x，以及每个询问的两个端点 l 和 r），然后去重 + 排序，最后列表的 size 就是映射之后的下标个数。

Q：如何确定每个初始下标映射之后的下标呢？
A：使用二分查找，找到下标列表中第一个 >= x 的元素下标，那就是原始下标 x 映射之后的新下标。

之后使用前缀和来处理这个问题就好了：设 l、r 离散化之后的下标分别为 l'、r'，前缀和数组为 s（s[i] 表示前 i 个离散下标上的数之和），则区间 [l, r] 的和就是 s[r' + 1] - s[l']。

代码

Java

import java.util.*;
import java.util.stream.Collectors;

/**
 * Interval-sum solver based on coordinate discretization plus prefix sums.
 *
 * <p>Reads {@code n} updates of the form "add {@code c} at position {@code x}" followed by
 * {@code m} queries {@code [l, r]} from standard input, and prints one sum per query.
 * Every coordinate that appears (update positions and both query endpoints) is replaced by
 * its index in the sorted, de-duplicated coordinate list, so the working arrays are indexed
 * by rank instead of by the raw coordinate value.
 */
public class Main {
    /** Initial capacity of the working arrays; {@code main} enlarges them when it is too small. */
    final static int N = 300010;
    /** Number of add operations and number of queries, as read from the input. */
    static int n, m;
    /** a[i] is the total added at discretized index i; s[i] is the sum of a[0..i-1]. */
    static int[] a = new int[N], s = new int[N];

    /** All coordinates mentioned by the input; sorted and de-duplicated before being searched. */
    static List<Integer> alls = new ArrayList<>();
    /** add holds the (x, c) updates, query holds the (l, r) ranges. */
    static List<Pair<Integer, Integer>> add = new ArrayList<>(), query = new ArrayList<>();

    /**
     * Reads the whole input, answers every query and writes the answers to standard output,
     * one per line.
     *
     * @param args unused
     */
    public static void main(String[] args) {
        Scanner scanner = new Scanner(System.in);
        // Store the counts in the static fields instead of shadowing them with locals.
        n = scanner.nextInt();
        m = scanner.nextInt();
        for (int i = 0; i < n; ++i) {
            int x = scanner.nextInt(), c = scanner.nextInt();
            add.add(new Pair<>(x, c));
            alls.add(x);
        }
        for (int i = 0; i < m; ++i) {
            int l = scanner.nextInt(), r = scanner.nextInt();
            query.add(new Pair<>(l, r));
            // Query endpoints must be discretized too, otherwise find() could not map them.
            alls.add(l);
            alls.add(r);
        }

        // De-duplicate and sort in one pass so that find() can binary-search the list.
        alls = alls.stream().distinct().sorted().collect(Collectors.toList());

        int size = alls.size();
        // s needs size + 1 slots; grow both arrays when the default capacity N is not enough.
        if (size + 1 > s.length) {
            a = new int[size + 1];
            s = new int[size + 1];
        }

        // Apply every add operation at the discretized position.
        for (Pair<Integer, Integer> item : add) {
            a[find(item.x)] += item.y;
        }
        // Build the prefix sums: s[i + 1] = a[0] + ... + a[i].
        for (int i = 0; i < size; ++i) {
            s[i + 1] = s[i] + a[i];
        }

        // Collect all answers and print once; the text is the same as one println per query.
        StringBuilder out = new StringBuilder();
        for (Pair<Integer, Integer> item : query) {
            int l = find(item.x), r = find(item.y);
            out.append(s[r + 1] - s[l]).append(System.lineSeparator());
        }
        System.out.print(out);
    }

    /**
     * Binary-searches {@code alls} for the first element that is {@code >= x}.
     *
     * <p>{@code alls} must already be sorted. If every element is smaller than {@code x} the
     * last index is returned, and if the list is empty the result is 0; callers in this class
     * only pass values that are present in the list.
     *
     * @param x original coordinate to look up
     * @return index in {@code alls} of the first element not smaller than {@code x}
     */
    static int find(int x) {
        int l = 0, r = alls.size() - 1;
        while (l < r) {
            int mid = (l + r) >>> 1;
            if (alls.get(mid) >= x) {
                r = mid;
            } else {
                l = mid + 1;
            }
        }
        return l;
    }
}

/**
 * Minimal generic holder for two values, read directly through its fields.
 *
 * @param <F> type of the first component
 * @param <S> type of the second component
 */
class Pair<F, S> {
    /** First component. */
    F x;
    /** Second component. */
    S y;

    /**
     * Creates a pair holding the two given values.
     *
     * @param x value stored in {@link #x}
     * @param y value stored in {@link #y}
     */
    public Pair(F x, S y) {
        this.y = y;
        this.x = x;
    }
}

Cpp

#include <algorithm>
#include <cstdio>
#include <cstring>
#include <iostream>
#include <vector>

using namespace std;

// Pair of ints: (position, delta) for an update, (left, right) for a query.
using PII = pair<int, int>;

// Capacity of the working arrays below.
const int N = 300010;

// Number of add operations and number of queries.
int n;
int m;

// a[i]: total added at discretized index i.
int a[N];
// s[i]: prefix sum a[0] + ... + a[i - 1].
int s[N];

// Every coordinate that appears in the input; sorted and de-duplicated in main().
vector<int> alls;
// Pending add operations.
vector<PII> add;
// Pending range queries.
vector<PII> query;

// Binary search over the sorted vector alls: returns the index of the first
// element that is >= x. When every element is smaller than x the last index is
// returned, and for an empty vector the result is 0.
int find(int x) {
    int lo = 0;
    int hi = static_cast<int>(alls.size()) - 1;
    while (lo < hi) {
        const int mid = (lo + hi) / 2;
        if (alls[mid] < x) {
            lo = mid + 1;   // answer lies strictly to the right of mid
        } else {
            hi = mid;       // mid itself may be the answer
        }
    }
    return lo;
}

int main()
{
    scanf("%d%d", &n, &m);
    for (int i = 0; i < n; i ++ ) {
        int x, c;
        scanf("%d%d", &x, &c);
        add.push_back({x, c});
        alls.push_back(x);
    }
    
    for (int i = 0; i < m; i ++ ) {
        int l, r;
        scanf("%d%d", &l, &r);
        query.push_back({l, r});
        alls.push_back(l);
        alls.push_back(r);
    }
    
    // 去重
    sort(alls.begin(), alls.end());
    alls.erase(unique(alls.begin(), alls.end()), alls.end());
    
    // 处理插入
    for (PII item: add) {
        int x = find(item.first);
        a[x] += item.second;
    }
    
    // 预处理前缀和
    for (int i = 1; i <= alls.size(); i ++ ) s[i] = s[i - 1] + a[i - 1];
    
    // 处理询问
    for (PII item: query) {
        int l = find(item.first), r = find(item.second);
        printf("%d\n", s[r + 1] - s[l]);
    }
    return 0;
}