利用堆排序找出数组中前n大的元素

Posted 阿汤的博客

tags:

篇首语:本文由小常识网(cha138.com)小编为大家整理,主要介绍了利用堆排序找出数组中前n大的元素相关的知识,希望对你有一定的参考价值。

#include <stdio.h>
#include <stdint.h>
#include <stdlib.h>
#include <time.h>
#define MAX_SIZE 400001

// Index helpers for an array-backed binary heap: the children of node i are
// 2*i and 2*i + 1, and its parent is i / 2. Note that LEFT(0) == 0, so index 0
// has index 1 as its only distinct child.
// Every argument is parenthesized so that expressions such as LEFT(i + 1)
// expand with the intended precedence.
#define PARENT(i) ((i) / 2)
#define RIGHT(i) ((i) * 2 + 1)
#define LEFT(i) ((i) * 2)
// Swap a and b, using t as scratch storage. All three must be assignable.
#define EXCHANGE(a,b,t) do{(t)=(a);(a)=(b);(b)=(t);}while(0)

// Write a random ordering of the distinct integers 0 .. cnt-1, separated by
// spaces, to the file "test_data_<cnt>.txt" in the current directory.
//
// cnt must be smaller than MAX_SIZE; otherwise a message is printed and
// nothing is written. Failures to allocate, open or close are reported on
// stdout and the function simply returns.
void gen_test_data(uint32_t cnt)
{
    if (cnt >= MAX_SIZE) { printf("cnt too largr\n"); return; }

    char file_name[256];
    snprintf(file_name, sizeof file_name, "test_data_%u.txt", (unsigned)cnt);

    // Heap allocation keeps the working set off the stack. Ask for at least
    // one element so that malloc(0) returning NULL is not mistaken for failure.
    uint32_t *values = malloc((cnt > 0 ? cnt : 1) * sizeof *values);
    if (NULL == values) { printf("alloc for %s error!\n", file_name); return; }

    FILE *fp = fopen(file_name, "w");
    if (NULL == fp)
    {
        printf("open %s error!\n", file_name);
        free(values);
        return;
    }

    for (uint32_t i = 0; i < cnt; ++i) { values[i] = i; }

    // Fisher-Yates shuffle: every value appears exactly once, and no probing
    // for a free slot is needed.
    for (uint32_t i = cnt; i > 1; --i)
    {
        uint32_t j = (uint32_t)rand() % i;
        uint32_t held = values[i - 1];
        values[i - 1] = values[j];
        values[j] = held;
    }

    for (uint32_t i = 0; i < cnt; ++i)
    {
        fprintf(fp, "%u ", (unsigned)values[i]);
    }

    // fclose flushes buffered output, so a failure here means lost data.
    if (fclose(fp) != 0) { printf("close %s error!\n", file_name); }
    free(values);
}

// Read integers from "test_data_<data_cnt>.txt" into arr.
//
// arr       destination buffer with room for `size` elements
// size      capacity of arr
// cnt       in/out: index of the next free slot in arr; it is advanced by one
//           for every value stored (the caller is expected to initialize it)
// data_cnt  number used to build the file name; rejected if negative or
//           larger than size
//
// Reading stops at end of file, at the first token that is not an integer,
// or when arr is full. Only successfully parsed values are counted.
void read_data(int32_t arr[],const uint32_t size,uint32_t *cnt,const int32_t data_cnt)
{
    FILE *fp = NULL;
    char file_name[256];
    int value = 0;

    if (data_cnt < 0 || (uint32_t)data_cnt > size) { printf("data_cnt too largr\n"); return; }
    snprintf(file_name, sizeof file_name, "test_data_%d.txt", (int)data_cnt);
    fp = fopen(file_name, "r");
    if (NULL == fp) { printf("open %s error!\n", file_name); return; }

    // Drive the loop with fscanf's return value instead of feof(): feof() only
    // becomes true after a read has already failed, which would count one
    // element that was never stored.
    while (*cnt < size && fscanf(fp, "%d", &value) == 1)
    {
        arr[*cnt] = (int32_t)value;
        (*cnt)++;
    }
    fclose(fp);
}

// Quick sort: sorts arr[low..high] (both bounds inclusive) in DESCENDING
// order, in place. A range with low >= high is left untouched.
//
// The pivot is taken from the middle of the range so that already-sorted
// input does not produce maximally unbalanced partitions. Only the smaller
// partition is handled recursively; the larger one is processed by the loop,
// which keeps the recursion depth logarithmic in the range length.
void quick_sort(int32_t arr[],int32_t low,int32_t high)
{
    while (low < high)
    {
        int32_t mid = low + (high - low) / 2;
        int32_t pivot = arr[mid];
        int32_t i = low, j = high;

        // Move the first element into the pivot's old slot; this leaves a
        // "hole" at index low that the partition loop fills.
        arr[mid] = arr[low];

        while (i < j)
        {
            // Scan from the right for a value that belongs left of the pivot.
            while (i < j && arr[j] <= pivot) j--;
            if (i < j) { arr[i] = arr[j]; i++; }
            // Scan from the left for a value that belongs right of the pivot.
            while (i < j && arr[i] > pivot) i++;
            if (i < j) { arr[j] = arr[i]; j--; }
        }
        arr[i] = pivot;

        if (i - low < high - i)
        {
            quick_sort(arr, low, i - 1);
            low = i + 1;
        }
        else
        {
            quick_sort(arr, i + 1, high);
            high = i - 1;
        }
    }
}

// Sift the element at index i down through arr[0..size) until neither of its
// children (at LEFT(i) and RIGHT(i)) holds a larger value. Children whose
// index is not below size are ignored.
void max_heapify(int32_t arr[],const uint32_t size,uint32_t i)
{
    for (;;)
    {
        const int32_t lchild = LEFT(i);
        const int32_t rchild = RIGHT(i);
        int32_t top = i;
        int32_t scratch = 0;

        // Pick the largest of the node and its in-range children.
        if (lchild < size && arr[lchild] > arr[i]) top = lchild;
        if (rchild < size && arr[rchild] > arr[top]) top = rchild;

        // The node already dominates its children: nothing left to do.
        if (top == i) return;

        EXCHANGE(arr[i], arr[top], scratch);
        i = top;    // continue sifting from the child that was swapped
    }
}

// Sift the element at index i down through arr[0..size) until neither of its
// children (at LEFT(i) and RIGHT(i)) holds a smaller value. Children whose
// index is not below size are ignored.
void min_heapify(int32_t arr[],const uint32_t size,uint32_t i)
{
    for (;;)
    {
        const int32_t lchild = LEFT(i);
        const int32_t rchild = RIGHT(i);
        int32_t smallest = i;
        int32_t scratch = 0;

        // Pick the smallest of the node and its in-range children.
        if (lchild < size && arr[lchild] < arr[i]) smallest = lchild;
        if (rchild < size && arr[rchild] < arr[smallest]) smallest = rchild;

        // The node is already no larger than its children: done.
        if (smallest == i) return;

        EXCHANGE(arr[i], arr[smallest], scratch);
        i = smallest;    // continue sifting from the child that was swapped
    }
}

// Rearrange arr so that its topn largest values end up in arr[0..topn), in
// heap order (not sorted) with the smallest of them at arr[0].
//
// arr       array to rearrange in place
// arr_size  number of valid elements in arr
// topn      how many of the largest values to collect; values larger than
//           arr_size are clamped to arr_size, and nothing is done when the
//           effective count is not positive
void get_topn_heap(int32_t arr[], const int32_t arr_size, const int32_t topn)
{
    // Never build a heap over more elements than the array actually holds.
    const int32_t heap_size = topn < arr_size ? topn : arr_size;
    int32_t i = 0, tmp = 0;

    if (heap_size <= 0) return;

    // Build a min-heap (a priority queue) over arr[0..heap_size).
    for (i = heap_size / 2; i >= 0; --i) min_heapify(arr, heap_size, i);

    for (i = heap_size; i < arr_size; ++i)
    {
        // Not larger than the smallest kept value: it cannot improve the set.
        if (arr[i] <= arr[0]) continue;
        // Replace the current minimum and restore the heap order.
        EXCHANGE(arr[0], arr[i], tmp);
        min_heapify(arr, heap_size, 0);
    }
}

// Print the first cnt elements of arr on one line, each right-aligned in a
// field of width 4 and followed by a space, then end the line.
void dump1(int32_t arr[],const uint32_t cnt)
{
    const int32_t *cur = arr;
    const int32_t *const stop = arr + cnt;

    while (cur != stop)
    {
        printf("%4d ", *cur);
        ++cur;
    }
    printf("\n");
}



// Print arr[start..end) on one line, each value right-aligned in a field of
// width 5 and followed by a space, then end the line.
//
// An empty range (start >= end, or end not positive) prints only the newline.
void dump2(int32_t arr[],const uint32_t start,const int32_t end)
{
    // Guard before converting: a negative end compared against an unsigned
    // index would otherwise turn into a huge upper bound.
    if (end > 0)
    {
        const uint32_t stop = (uint32_t)end;
        uint32_t i = start;
        for (; i < stop; ++i)
        {
            printf("%5d ", (int)arr[i]);
        }
    }
    printf("\n");
}

// Demo driver: generate a test file of data_cnt distinct integers, read it
// back, select the topn largest values with a min-heap, sort those in
// descending order and print them.
// Returns 0 on success and 1 when no data could be read.
int32_t main(int32_t argc, char *argv[])
{
    // Static storage: the array is about 1.6 MB, which is too large to place
    // safely on the stack on platforms with a small default stack.
    static int32_t arr[MAX_SIZE];
    uint32_t data_cnt = 40000,topn = 10;
    uint32_t cnt = 0;

    (void)argc;
    (void)argv;

    gen_test_data(data_cnt);
    read_data(arr, MAX_SIZE, &cnt, (int32_t)data_cnt);
    if (cnt == 0)
    {
        // Nothing was read (e.g. the file could not be opened).
        printf("no data read\n");
        return 1;
    }
    // Never ask for more elements than were actually read.
    if (topn > cnt) topn = cnt;

    get_topn_heap(arr, (int32_t)cnt, (int32_t)topn);
    quick_sort(arr, 0, (int32_t)topn - 1);
    dump2(arr, 0, (int32_t)topn);
    return 0;
}

 

以上是关于利用堆排序找出数组中前n大的元素的主要内容,如果未能解决你的问题,请参考以下文章:

编写程序,找出数组a中前n个元素中的最小元素及其下标

最小的K个数

求第K大算法总结

求第K大算法总结

求第K大算法总结

Top K以及java priorityqueue