算法设计与分析实验指导1——快速排序及第k小数

最新推荐文章于 2023-01-15 21:36:36 发布

ShowM3TheCode

最新推荐文章于 2023-01-15 21:36:36 发布

阅读量298

点赞数

分类专栏：学校课程作业之路文章标签：算法排序算法数据结构

本文链接：https://blog.csdn.net/ShowMeTheCod3/article/details/124892278

版权

学校课程作业之路专栏收录该内容

5 篇文章 5 订阅

订阅专栏

文章目录

- 1. 快速排序及第k小数

1. 快速排序及第k小数

1.1 快速排序

1.1.1 Implementation 1

核心代码如下：

int partition(vector<int> &nums, int l, int r) {
    int i = l;
    int j = r;
    while (i < j) {
        while (i < j && nums[i] >= nums[l]) j--;
        while (i < j && nums[i] <= nums[l]) i++;
        swap(nums[i], nums[j]);
    }
    swap(nums[i], nums[l]);
    return i;
}

void quickSort(vector<int> &nums, int l, int r) {
    if (l >= r) return;
    int i = partition(nums, l, r);
    quickSort(nums, l, i - 1);
    quickSort(nums, i + 1, r);
}

1.1.2 算法特性分析

时间复杂度：

最佳Ω(NlogN) ：最佳情况下，每轮哨兵划分操作将数组划分为等长度的两个子数组；哨兵划分操作为线性时间复杂度 O(N)；递归轮数共 O(logN) 。

平均Θ(NlogN) ：在随机输入数组下，哨兵划分操作的递归轮数也为O(logN) 。

最差 O(N^2)：在某些特殊输入数组下，每轮哨兵划分操作都将长度为 N 的数组划分为长度为1和N−1的两个子数组，此时递归轮数达到N 。

虽然平均时间复杂度与「归并排序」和「堆排序」一致，但在实际使用中快速排序效率更高，这是因为：

最差情况稀疏性：虽然快速排序的最差时间复杂度为 O(N^2)，差于归并排序和堆排序，但统计意义上看，这种情况出现的机率很低。大部分情况下，快速排序以 O(NlogN) 复杂度运行。

缓存使用效率高：哨兵划分操作时，将整个子数组加载入缓存中，访问元素效率很高；堆排序需要跳跃式访问元素，因此不具有此特性。

常数系数低：在提及的三种算法中，快速排序的比较、赋值、交换三种操作的综合耗时最低（类似于插入排序快于冒泡排序的原理）。

原地：不用借助辅助数组的额外空间，递归仅使用O(logN) 大小的栈帧空间。

非稳定：哨兵划分操作可能改变相等元素的相对顺序。

自适应：若每轮哨兵划分操作都将长度为 NN 的数组划分为长度1和N−1两个子数组，则时间复杂度劣化至O(N^2)。

1.1.3 Improvement 1: 降低空间复杂度——Tail Call

最坏情况进行N次递归，那么最差时间复杂度会达到O(N)。

每轮递归时，仅对较短的子数组执行哨兵划分 partition() ，就可将最差的递归深度控制在O(logN) （每轮递归的子数组长度都≤ 当前数组长度），即实现最差空间复杂度 O(logN) 。

代码只需修改quick_sort()：

void quickSort(vector<int> &nums, int l, int r) {
	while (l < r) {
        int i = partition(nums, l, r);
        if (i - l < r - i) {
            quickSort(nums, l, i - 1);
            l = i + 1;
        }
        else {
            quickSort(nums, i + 1, r);
            r = i - 1;
        }
    }
}

1.1.3 Improvement 2:避免最坏情况——随机基准数

通过随机函数，随机选取哨兵值，极大程度避免完全有序或者完全倒序的情况下时间复杂度为O(n²)的情况。

partition()代码修改如下：

int partition(vector<int>& nums, int l, int r) {
    // 在闭区间 [l, r] 随机选取任意索引，并与 nums[l] 交换
    int ra = l + rand() % (r - l + 1);
    swap(nums[l], nums[ra]);
    // 以 nums[l] 作为基准数
    int i = l, j = r;
    while (i < j) {
        while (i < j && nums[j] >= nums[l]) j--;
        while (i < j && nums[i] <= nums[l]) i++;
        swap(nums[i], nums[j]);
    }
    swap(nums[i], nums[l]);
    return i;
}

1.2 第k小数

1.2.1 Implementation 1: 基于快排

继承快排的思想，当哨兵位置为k时返回对应值。

partition部分可以继续沿用1.1.3的改进，将quickSort段代码改成如下：

int kMin(vector<int>& nums, int l, int r, int k) {
    int i = partition(nums, l, r);
    if (i == k) {
        return nums[k];
    }
    if (i < k) {
        return kMin(nums, i + 1, r, k);
    }
    else return kMin(nums, l, i - 1, k);
}

该方法的时间复杂度为θ(n)，但是最坏情况达到了O(n²)。

空间复杂度为O(logn)，即递归调用栈空间的空间代价。

1.2.2 Implementation 2: 基于堆排序

堆的性质是每次弹出最小的一个值，那么找第k小的数，也就是调用k次堆的弹出函数。

堆的API如下：

#include <vector>
#include <algorithm>
#include <iostream>
using namespace std;


template<class T> class myHeap {
private:
    T* heap;
    int capacity;
    const int REFACTOR = 2;
    void heapSort(int n);
    void switchSons(int i, int size);
    void topDownHeapify(int maxPos);
public:
    myHeap();
    myHeap(T* array, int size);
    void insert(T item);
    void pop();
    void print();
    T peek();
};

template<class T> myHeap<T>::myHeap() {
    heap = new T[11];
    capacity = 10;
    heap[0] = 0;
}

template<class T> myHeap<T>::myHeap(T* array, int size) {
    heap = new T[size + 1];
    heap[0] = size;
    capacity = size;
    for (int i = 1; i <= size; i++) {
        heap[i] = array[i - 1];
    }
    heapSort(heap[0]);
}

template<class T> void myHeap<T>::heapSort(int size) {
    if (size == 1) return;
    int n = size / 2;
    for (int i = n; i >= 1; i--) {
        switchSons(i, size);
    }
    swap(heap[1], heap[size]);
    heapSort(size - 1);
}

template<class T> void myHeap<T>::switchSons(int i, int size) {
    if (2 * i + 1 > size) {
        if (heap[i] < heap[2 * i]) {
            swap(heap[i], heap[2 * i]);
        }
        return;
    }

    T left = heap[2 * i];
    T right = heap[2 * i + 1];

    if (right > left && right > heap[i]) {
        swap(heap[i], heap[2 * i + 1]);
    }
    else if (left > heap[i]) {
        swap(heap[i], heap[2 * i]);
    }
}

template<class T> void myHeap<T>::print() {
    for (int i = 1; i <= heap[0]; i++) {
        cout << heap[i] << " ";
    }
    cout << endl;
}

template<class T> void myHeap<T>::insert(T item) {
    if (heap[0] == capacity) {
        capacity *= REFACTOR;
        T* tmp = new T[capacity];
        for (int i = 0; i <= heap[0]; i++) {
            tmp[i] = heap[i];
        }
        heap = tmp;
    }
    heap[heap[0] + 1] = item;
    int i = heap[0]++ + 1;
    int j = heap[0] / 2;
    while (j >= 0 && i != 1) {
        if (heap[j] <= item) break;
        heap[i] = heap[j];
        i = j;
        j = i / 2;
    }
    heap[i] = item;
}

template<class T> void myHeap<T>::pop() {
    if (heap[0] == 0) return;
    // print();
    cout << heap[1] << endl;
    swap(heap[1], heap[heap[0]--]);
    // print();

    topDownHeapify(1);
}

template<class T> void myHeap<T>::topDownHeapify(int maxPos) {
    // 已到达叶子结点
    if (maxPos * 2 > heap[0]) return;
    if (maxPos * 2 == heap[0]) {
        if (heap[heap[0]] < heap[maxPos]) swap(heap[maxPos], heap[heap[0]]);
        return;
    }
    int left = heap[maxPos * 2];
    int right = heap[maxPos * 2 + 1];
    if (right < left && right < heap[maxPos]) {
        swap(heap[maxPos], heap[maxPos * 2 + 1]);
        // print();
        topDownHeapify(maxPos * 2 + 1);
    }
    else if (left < heap[maxPos]) {
        swap(heap[maxPos], heap[maxPos * 2]);
        // print();
        topDownHeapify(maxPos * 2);
    }
}

template<class T> T myHeap<T>::peek() {
    if (heap[0] == 0) {
        exit(1);
    }
    return heap[1];
}

通过上述建立的myHeap类，我们求第k小数也可以用如下方法：

int kMin(myHeap<int> &nums, int k) {
    for (int i = 1; i < k; i++) {
        nums.pop();
    }
    return nums.peek();
}

该方法的时间复杂度为θ(nlogn)，但是最坏情况同样达到了O(n²)。

空间复杂度为O(logn)，即递归调用栈空间的空间代价。

1.3 正确性验证

为了验证正确性，选择了LeetCode中的一道题目进行验证。

1.3.1 题目：215. 数组中的第K个最大元素

给定整数数组 nums 和整数 k，请返回数组中第 k个最大的元素。

请注意，你需要找的是数组排序后的第 k 个最大的元素，而不是第 k 个不同的元素。

1.3.2 基于快排的实现

#include <vector>
#include <string>
#include <algorithm>
using namespace std;

class Solution {
public:
    int findKthLargest(vector<int>& nums, int k) {
        int n = nums.size();
        k = n - k;
        return kMin(nums, 0, n - 1, k);
    }

    int partition(vector<int>& nums, int l, int r) {
        int i = l;
        int j = r;
        while (i < j) {
            while (i < j && nums[j] >= nums[l]) j--;
            while (i < j && nums[i] <= nums[l]) i++;
            swap(nums[i], nums[j]);
        }
        swap(nums[i], nums[l]);
        return i;
    }

    int kMin(vector<int>& nums, int l, int r, int k) {
        int i = partition(nums, l, r);
        if (i == k) {
            return nums[k];
        }
        if (i < k) {
            return kMin(nums, i + 1, r, k);
        }
        else return kMin(nums, l, i - 1, k);
    }
};

1.3.3 基于堆排序的实现

#include <vector>
#include <string>
#include <algorithm>
using namespace std;

class Solution {
public:
    int findKthLargest(vector<int>& nums, int k) {
        int n = nums.size();
        k = n - k + 1;
        vector<int> ans(n + 1);
        ans[0] = n;
        for (int i = 1; i <= n; i++) {
            ans[i] = nums[i - 1];
        }
        heapSort(ans, n);
        return ans[k];
    }

    void heapSort(vector<int>& heap, int size) {
        if (size == 1) return;
        int n = size / 2;
        for (int i = n; i >= 1; i--) {
            switchSons(heap, i, size);
        }
        swap(heap[1], heap[size]);
        heapSort(heap, size - 1);
    }

    void switchSons(vector<int>& heap, int i, int size) {
        if (2 * i + 1 > size) {
            if (heap[i] < heap[2 * i]) {
                swap(heap[i], heap[2 * i]);
                }
            return;
        }

        int left = heap[2 * i];
        int right = heap[2 * i + 1];

        if (right > left && right > heap[i]) {
            swap(heap[i], heap[2 * i + 1]);
        }
        else if (left > heap[i]) {
            swap(heap[i], heap[2 * i]);
        }
    }
};

ShowM3TheCode

关注

0
点赞
踩
3

收藏

觉得还不错? 一键收藏
0
评论
算法设计与分析实验指导1——快速排序及第k小数

文章目录1. 快速排序及第k小数1.1 快速排序1.1.1 Implementation 11.1.2 算法特性分析1.1.3 Improvement 1: 降低空间复杂度——Tail Call1.1.3 Improvement 2:避免最坏情况——随机基准数1.2 第k小数1.2.1 Implementation 1: 基于快排1.2.2 Implementation 2: 基于堆排序1.3 正确性验证1.3.1 题目：[215. 数组中的第K个最大元素](https://leetcode.cn/prob
复制链接

扫一扫

专栏目录