归并排序函数

时间:2013-02-12 02:55:00

标签: c merge sorting

我正在尝试实现一个递归的归并排序函数,它的参数与C库中定义的qsort函数相同。但是,打印出来的值并没有按正确的顺序排列。有人可以看看我的函数,并告诉我如何纠正这个问题吗?我还附上了我使用的比较函数。提前谢谢。

  /*
   * Comparison callback with the qsort()-style signature.
   *
   * Returns -1, 1 or 0 depending on how the two arguments compare.
   * NOTE(review): the tests below compare the two pointer values themselves
   * (the addresses), not the objects they point to, so the result does not
   * reflect the ordering of the elements being sorted.
   */
  int cmp (const void *first, const void *second)
    {  
        /* Pointer comparison: 'first' and 'second' are never dereferenced. */
        if (first < second)
            return -1;
        else if (first > second)
            return 1;
        else
            return 0;
    }



    /*
     * Attempted recursive merge sort with the same parameters as qsort():
     *   b   - start of the array
     *   n   - number of elements
     *   s   - size of one element in bytes
     *   cmp - comparison callback
     *
     * NOTE(review): as written this function does not sort its input; the
     * individual problems are flagged on the lines concerned.
     */
    static void msort (void *b,size_t n,size_t s, int(*cmp)(const void*,const void*) )

    {
        char *tmp;

        /* Scratch buffer for the merge.
           NOTE(review): t is never passed to free() anywhere in this function,
           so every call that gets past this point leaks s*n bytes. */
        void *t;
        if ((t = malloc(s*n)) == NULL)
        {
            printf("\nError: No Memory.");
            return;
        }   
        char *b1, *b2;
        size_t n1, n2;



        /* Split point: n1 = n/2 rounded down, n2 = the remainder, so n2 is
           either equal to n1 (n even) or n1 + 1 (n odd). */
        n1 = n / 2;
        n2 = n - n1;
        b1 = b;
        b2 = (char *) b + (n1 * s);

        /* NOTE(review): n2 == n1 whenever n is even, so this returns before
           any sorting has been done for every even n. */
        if (n2 <= n1)
            return;

        /* NOTE(review): the sub-ranges passed here have n2 and n1+1 elements,
           whereas the merge below treats the runs as n1 elements at b1 and n2
           elements at b2.  For n == 1 the first call passes n2 == 1 again, so
           the recursion does not terminate. */
        msort (b1, n2, s, cmp);
        msort (b2, n1+1, s, cmp);

        tmp = t;

        /* Merge: repeatedly copy the smaller head element of the two runs
           into the scratch buffer. */
        while (n1 > 0 && n2 > 0)
        {
            if ((*cmp) (b1, b2) <= 0)
            {
                memcpy (tmp, b1, s);
                tmp += s;
                b1 += s;
                --n1;
            }
            else
            {
                memcpy (tmp, b2, s);
                tmp += s;
                b2 += s;
                --n2;
            }
        }
        /* Flush whatever is left of the first run. */
        if (n1 > 0)
            memcpy (tmp, b1, n1 * s);
        /* Elements still unconsumed in the second run already sit at the end
           of b, so only the first n - n2 merged elements are copied back. */
        memcpy (b, t, (n - n2) * s);
    } 

这是我的main函数。这里调用的一些函数,我省略了它们的定义。

/*
 * Test driver: reads the element count n from standard input (values below
 * 10 are rejected), builds an int array with gen_int_array(), sorts a clone
 * of it with msort() and dumps the result when n < 50.
 *
 * gen_int_array(), clone_int_array() and dump_int_array() are defined
 * elsewhere and are not shown here.
 */
int main()
{
    int n;
    int *a;
    int *b = NULL;  /* only assigned by the disabled clone below; NULL keeps free(b) well defined */
    int *c;

    printf("enter n: ");
    if (scanf("%d", &n) != 1 || n < 10)
    {
        fprintf(stderr, "bad input.  goodbye\n");
        abort();
    }

    /* sizeof yields a size_t, which has to be printed with %zu, not %d. */
    printf("sizeof(double) %zu\n", sizeof(double));

    printf("running experiments with n=%d\n", n);

    a = gen_int_array(n, 5000);
    //b = clone_int_array(a, n);
    c = clone_int_array(a, n);

    //ssort(a, n);
    //isort(b, n);
    //msort_int(c, n);

    //msort_int(d, n);
    msort(c, n, sizeof(int), cmp);

    if (n < 50)
        dump_int_array(c, n);

    free(a);
    free(b);    /* free(NULL) is a no-op while the clone above stays disabled */
    free(c);

    return 0;
}

1 个答案:

答案 0 :(得分:1)

一个问题出在你的比较函数上:它只是在比较两个指针本身,而不是指针所指向的值。由于您没有向我们展示要进行归并排序的数组的定义,我们很难提供更具体的帮助。不过,假设您排序的是int数组,那么比较函数可以写成:

/*
 * qsort()-style comparator for int elements.
 *
 * Reads both arguments as int and yields -1, 0 or +1 according to whether
 * the first value is less than, equal to or greater than the second.
 */
int comparator(void const *v1, void const *v2)
{
    const int lhs = *(const int *)v1;
    const int rhs = *(const int *)v2;

    /* Plain relational tests: no subtraction, hence no overflow. */
    return (lhs < rhs) ? -1 : (lhs > rhs) ? +1 : 0;
}

请注意,这种写法可以避免算术溢出以及其他类似的未定义行为。它也适合作为比较结构体和其他更复杂值的模板:您可以继续添加成对的 < 和 > 测试,直到再没有可用于区分两个值的条件为止。

我们还可以观察到代码中确实存在内存泄漏。您在函数内部分配一个数组,但不释放它或返回指向它的指针。


使用原始msort()和comparator()的SSCCE

SSCCE是指简短、自包含、正确的示例(Short, Self-Contained, Correct Example)。

#include <stdio.h>
#include <stdlib.h>
#include <string.h>

/*
 * qsort()-style comparator for int elements: returns -1, 0 or +1 when the
 * first value is respectively less than, equal to or greater than the second.
 */
static int comparator(void const *v1, void const *v2)
{
    const int *lhs = v1;
    const int *rhs = v2;

    /* Each relational test is 0 or 1, so the difference is -1, 0 or +1. */
    return (*lhs > *rhs) - (*lhs < *rhs);
}

/*
 * Verify that array[0..n-1] is in non-decreasing order.
 *
 * Every adjacent pair that is out of order is reported on stderr.  If at
 * least one such pair was found the process terminates with exit status 1;
 * otherwise the function simply returns.
 */
static void sort_check(int *array, size_t n)
{
    int in_order = 1;
    size_t idx = 1;

    while (idx < n)
    {
        if (array[idx] < array[idx-1])
        {
            fprintf(stderr, "Elements %zu (value %d) and %zu (value %d) are out of order\n",
                    idx-1, array[idx-1], idx, array[idx]);
            in_order = 0;
        }
        idx++;
    }

    if (!in_order)
        exit(1);
}

/*
 * The merge sort exactly as posted in the question, reproduced so that its
 * behaviour can be demonstrated by the test harness in this file.
 *
 *   b   - start of the array
 *   n   - number of elements
 *   s   - size of one element in bytes
 *   cmp - qsort()-style comparison callback
 *
 * NOTE(review): this version is known not to sort; the problems are flagged
 * on the lines concerned.
 */
static void msort(void *b, size_t n, size_t s, int(*cmp)(const void*, const void*) )
{
    char *tmp;
    void *t;

    /* Scratch buffer for the merge.
       NOTE(review): t is never passed to free() in this function, so the
       buffer leaks on every path that gets past the allocation. */
    if ((t = malloc(s*n)) == NULL)
    {
        fprintf(stderr, "Error: No Memory.\n");
        return;
    }

    char *b1, *b2;
    size_t n1, n2;

    /* n1 = n/2 rounded down, n2 = the rest: n2 == n1 for even n and
       n2 == n1 + 1 for odd n. */
    n1 = n / 2;
    n2 = n - n1;
    b1 = b;
    b2 = (char *) b + (n1 * s);

    /* NOTE(review): true for every even n, so the function returns here
       without having sorted anything. */
    if (n2 <= n1)
        return;

    /* NOTE(review): the recursive calls use n2 and n1+1 elements, while the
       merge below assumes n1 elements at b1 and n2 elements at b2.  With
       n == 1 the first call is msort(b1, 1, ...) again, so the recursion
       never terminates. */
    msort (b1, n2, s, cmp);
    msort (b2, n1+1, s, cmp);

    tmp = t;

    /* Merge the two runs into the scratch buffer, smaller head first. */
    while (n1 > 0 && n2 > 0)
    {
        if ((*cmp) (b1, b2) <= 0)
        {
            memcpy (tmp, b1, s);
            tmp += s;
            b1 += s;
            --n1;
        }
        else
        {
            memcpy (tmp, b2, s);
            tmp += s;
            b2 += s;
            --n2;
        }
    }
    /* Flush the remainder of the first run. */
    if (n1 > 0)
        memcpy (tmp, b1, n1 * s);
    /* What is left of the second run is already at the end of b, so only
       the first n - n2 merged elements are copied back. */
    memcpy (b, t, (n - n2) * s);
}

/*
 * Allocate an array of n ints and fill it with pseudo-random values.
 *
 * Each element is rand() % max_val.  A max_val of 0 would make that a
 * division by zero, so in that case every element is set to 0 instead.
 *
 * The allocation goes through calloc(), which fails cleanly when the
 * requested element count would overflow the byte size.  At least one
 * element is always requested so that n == 0 is not mistaken for an
 * allocation failure on systems where a zero-size request returns NULL.
 *
 * Returns a non-NULL pointer that the caller must release with free().
 * On allocation failure a message is written to stderr and the process
 * exits with status 1.
 */
static int *gen_int_array(size_t n, int max_val)
{
    int *a = calloc(n ? n : 1, sizeof(*a));
    if (a == NULL)
    {
        fprintf(stderr, "Out of memory.\n");
        exit(1);
    }
    for (size_t i = 0; i < n; i++)
        a[i] = (max_val != 0) ? rand() % max_val : 0;
    return a;
}

/*
 * Return a freshly allocated copy of the first n ints of master.
 *
 * The allocation goes through calloc(), which fails cleanly when the
 * requested element count would overflow the byte size.  At least one
 * element is always requested so that n == 0 is not mistaken for an
 * allocation failure on systems where a zero-size request returns NULL.
 * master is only read, never written.
 *
 * Returns a non-NULL pointer that the caller must release with free().
 * On allocation failure a message is written to stderr and the process
 * exits with status 1.
 */
static int *clone_int_array(const int *master, size_t n)
{
    int *a = calloc(n ? n : 1, sizeof(*a));
    if (a == NULL)
    {
        fprintf(stderr, "Out of memory.\n");
        exit(1);
    }
    /* Skip the copy for n == 0 so master is never touched in that case. */
    if (n > 0)
        memcpy(a, master, n * sizeof(*a));
    return a;
}

/*
 * Write a labelled dump of a[0..n-1] to fp.
 *
 * Output is a header line "Array: <tag> (size <n>)" followed by one line
 * holding the values separated by commas (an empty line when n is 0).
 */
static void dump_array(FILE *fp, char const *tag, int *a, size_t n)
{
    fprintf(fp, "Array: %s (size %zu)\n", tag, n);

    size_t idx = 0;
    while (idx < n)
    {
        /* No separator in front of the first value, a comma before the rest. */
        fprintf(fp, "%s%d", (idx == 0) ? "" : ",", a[idx]);
        idx++;
    }
    putc('\n', fp);
}

/*
 * Test harness: sorts the same random data once with qsort() and once with
 * msort(), dumping and checking the result of each.
 *
 * The element count is taken from the first command-line argument; when no
 * argument is given, or the value is not positive, 10 is used.
 */
int main(int argc, char **argv)
{
    int n = (argc == 1) ? 10 : atoi(argv[1]);
    if (n <= 0)
        n = 10;

    printf("running experiments with n = %d\n", n);

    /* Both sorts start from identical input. */
    int *for_qsort = gen_int_array(n, 5000);
    int *for_msort = clone_int_array(for_qsort, n);

    dump_array(stdout, "Unsorted", for_qsort, n);

    /* Reference result from the library sort. */
    printf("Q-Sort\n");
    qsort(for_qsort, n, sizeof(int), comparator);
    dump_array(stdout, "Q-sorted", for_qsort, n);
    sort_check(for_qsort, n);

    /* Function under test. */
    printf("M-Sort\n");
    msort(for_msort, n, sizeof(int), comparator);
    dump_array(stdout, "M-sorted", for_msort, n);
    sort_check(for_msort, n);

    free(for_qsort);
    free(for_msort);

    return 0;
}

此输出(在Mac OS X 10.7.5上没有参数)是:

running experiments with n = 10
Array: Unsorted (size 10)
1807,249,73,3658,3930,1272,2544,878,2923,2709
Q-Sort
Array: Q-sorted (size 10)
73,249,878,1272,1807,2544,2709,2923,3658,3930
M-Sort
Array: M-sorted (size 10)
1807,249,73,3658,3930,1272,2544,878,2923,2709
Elements 0 (value 1807) and 1 (value 249) are out of order
Elements 1 (value 249) and 2 (value 73) are out of order
Elements 4 (value 3930) and 5 (value 1272) are out of order
Elements 6 (value 2544) and 7 (value 878) are out of order
Elements 8 (value 2923) and 9 (value 2709) are out of order

如您所见,qsort()把数据排成了正确的顺序,而msort()完全没有改变数据的顺序。测试程序没有处理0个元素的情况,但以参数1运行(即`msort 1`)时,msort()函数会产生核心转储。退化情况因段错误而失败,总是一个不好的迹象。

大小为1(以及大小为0)时的问题,可以通过在msort()的入口处检查n,并在n <= 1时直接返回来修复。

下一个问题是if (n2 <= n1):它会让函数提前返回。实际上,只要n是偶数,这个条件就一定成立;而当n是奇数时,递归调用最终也会得到偶数的n,于是同样会提前返回。因此,真正的排序永远不会发生。下面是该函数的一个(部分)插桩版本,用来演示这一行为:

/*
 * Instrumented variant of the original merge sort, used to show why the
 * input is left unsorted.
 *
 *   b   - start of the array
 *   n   - number of elements
 *   s   - size of one element in bytes
 *   cmp - qsort()-style comparison callback
 *
 * Compared with the original it returns immediately for n <= 1, frees the
 * scratch buffer on the paths that allocated it, and prints "-->> msort(n)"
 * on entry and "<<-- msort(n)" on exit (calls with n <= 1 are not traced).
 * The early return on n2 <= n1 and the recursive call sizes are kept so
 * that their effect shows up in the trace.
 */
static void msort(void *b, size_t n, size_t s, int (*cmp)(const void *v1, const void *v2) )
{
    if (n <= 1)
        return;     /* Already sorted */

    printf("-->> msort(%zu)\n", n);
    /* Scratch buffer for the merge. */
    void *t = malloc(s*n);

    if (t == NULL)
    {
        fprintf(stderr, "Error: No Memory.\n");
        printf("<<-- msort(%zu)\n", n);
        return;
    }

    /* n1 = n/2 rounded down, n2 = the rest: equal for even n. */
    size_t n1 = n / 2;
    size_t n2 = n - n1;

    /* Retained from the original: fires for every even n, which is reported
       on stderr before giving up without sorting. */
    if (n2 <= n1)
    {
        fprintf(stderr, "Oops: %zu <= %zu\n", n2, n1);
        free(t);
        printf("<<-- msort(%zu)\n", n);
        return;
    }

    char *b1 = b;
    char *b2 = (char *) b + (n1 * s);

    /* Retained from the original: sub-range sizes n2 and n1+1, although the
       merge below works on n1 elements at b1 and n2 elements at b2. */
    msort(b1, n2, s, cmp);
    msort(b2, n1+1, s, cmp);

    char *tmp = t;

    /* Merge the two runs into the scratch buffer, smaller head first. */
    while (n1 > 0 && n2 > 0)
    {
        if ((*cmp)(b1, b2) <= 0)
        {
            memcpy(tmp, b1, s);
            tmp += s;
            b1 += s;
            --n1;
        }
        else
        {
            memcpy(tmp, b2, s);
            tmp += s;
            b2 += s;
            --n2;
        }
    }
    /* Flush the remainder of the first run. */
    if (n1 > 0)
        memcpy(tmp, b1, n1 * s);
    /* What is left of the second run is already at the end of b, so only
       the first n - n2 merged elements are copied back. */
    memcpy(b, t, (n - n2) * s);
    free(t);
    printf("<<-- msort(%zu)\n", n);
}

示例运行:

running experiments with n = 1
Array: Unsorted (size 1)
1807
Q-Sort
Array: Q-sorted (size 1)
1807
M-Sort
Array: M-sorted (size 1)
1807

running experiments with n = 2
Array: Unsorted (size 2)
1807,249
Q-Sort
Array: Q-sorted (size 2)
249,1807
M-Sort
-->> msort(2)
Oops: 1 <= 1
<<-- msort(2)
Array: M-sorted (size 2)
1807,249
Elements 0 (value 1807) and 1 (value 249) are out of order

running experiments with n = 3
Array: Unsorted (size 3)
1807,249,73
Q-Sort
Array: Q-sorted (size 3)
73,249,1807
M-Sort
-->> msort(3)
-->> msort(2)
Oops: 1 <= 1
<<-- msort(2)
-->> msort(2)
Oops: 1 <= 1
<<-- msort(2)
<<-- msort(3)
Array: M-sorted (size 3)
249,73,1807
Elements 0 (value 249) and 1 (value 73) are out of order

running experiments with n = 4
Array: Unsorted (size 4)
1807,249,73,3658
Q-Sort
Array: Q-sorted (size 4)
73,249,1807,3658
M-Sort
-->> msort(4)
Oops: 2 <= 2
<<-- msort(4)
Array: M-sorted (size 4)
1807,249,73,3658
Elements 0 (value 1807) and 1 (value 249) are out of order
Elements 1 (value 249) and 2 (value 73) are out of order

running experiments with n = 5
Array: Unsorted (size 5)
1807,249,73,3658,3930
Q-Sort
Array: Q-sorted (size 5)
73,249,1807,3658,3930
M-Sort
-->> msort(5)
-->> msort(3)
-->> msort(2)
Oops: 1 <= 1
<<-- msort(2)
-->> msort(2)
Oops: 1 <= 1
<<-- msort(2)
<<-- msort(3)
-->> msort(3)
-->> msort(2)
Oops: 1 <= 1
<<-- msort(2)
-->> msort(2)
Oops: 1 <= 1
<<-- msort(2)
<<-- msort(3)
<<-- msort(5)
Array: M-sorted (size 5)
249,73,1807,3658,3930
Elements 0 (value 249) and 1 (value 73) are out of order

running experiments with n = 6
Array: Unsorted (size 6)
1807,249,73,3658,3930,1272
Q-Sort
Array: Q-sorted (size 6)
73,249,1272,1807,3658,3930
M-Sort
-->> msort(6)
Oops: 3 <= 3
<<-- msort(6)
Array: M-sorted (size 6)
1807,249,73,3658,3930,1272
Elements 0 (value 1807) and 1 (value 249) are out of order
Elements 1 (value 249) and 2 (value 73) are out of order
Elements 4 (value 3930) and 5 (value 1272) are out of order

这是你需要自己解决的问题……我已经展示了一些调试技术,并诊断出了其中几个问题。请注意,跟踪函数的进入和退出会很有帮助(不过我偷了个懒,对大小为0或1的调用没有打印进入/退出信息)。特别是在递归代码中,打印函数的关键参数(这里是n,数组的起始地址可能也有用)很有帮助,这样就能把各次调用区分开来。


我觉得无聊了,或者是粗心,或者别的什么原因……总之,下面这段代码可以正常工作。改动包括:递归调用的参数、合并循环结束后的收尾处理,以及复制回原数组的部分。此外还完全删除了可疑的if (n2 <= n1)块,我想不出它的用途。哦,还增加了更多诊断输出:在进入和退出时打印数组。

/*
 * Recursive merge sort with the same parameters as qsort(), with tracing.
 *
 *   b   - start of the array
 *   n   - number of elements
 *   s   - size of one element in bytes
 *   cmp - qsort()-style comparison callback
 *
 * The array is split into a front half of n/2 elements and a back half of
 * the remaining elements; each half is sorted recursively and the two are
 * merged through a temporary buffer of n*s bytes, which is then copied back
 * over b.  If the buffer cannot be allocated an error is printed and the
 * array is left as it was.
 *
 * Diagnostics: entry and exit are traced on stdout and the array is dumped
 * at both points.  The dump casts b to int *, i.e. it treats the data as
 * ints.
 */
static void msort(void *b, size_t n, size_t s, int (*cmp)(const void *v1, const void *v2) )
{
    if (n <= 1)
        return;     /* Already sorted */

    printf("-->> msort(%zu)\n", n);
    dump_array(stdout, "Entry to msort()", (int *)b, n);

    void *scratch = malloc(s*n);
    if (scratch == NULL)
    {
        fprintf(stderr, "Error: No Memory.\n");
        printf("<<-- msort(%zu)\n", n);
        return;
    }

    size_t left_n = n / 2;
    size_t right_n = n - left_n;
    char *left = b;
    char *right = left + (left_n * s);

    /* Sort each half in place before merging. */
    msort(left, left_n, s, cmp);
    msort(right, right_n, s, cmp);

    char *out = scratch;

    for (; left_n > 0 && right_n > 0; out += s)
    {
        /* Ties go to the left run. */
        int take_left = (cmp(left, right) <= 0);

        memcpy(out, take_left ? left : right, s);
        if (take_left)
        {
            left += s;
            --left_n;
        }
        else
        {
            right += s;
            --right_n;
        }
    }

    /* At most one run still has elements; append them in one go. */
    if (left_n > 0)
        memcpy(out, left, left_n * s);
    else if (right_n > 0)
        memcpy(out, right, right_n * s);

    memcpy(b, scratch, n * s);
    free(scratch);

    dump_array(stdout, "Exit from msort()", (int *)b, n);
    printf("<<-- msort(%zu)\n", n);
}