order.c 10.1 KB
/**********************************************************************/
/*                                                                    */
/*             FILENAME:  order.c                                     */
/*             BY:  Jonathan G. Fiscus                                */
/*                  NATIONAL INSTITUTE OF STANDARDS AND TECHNOLOGY    */
/*                  SPEECH RECOGNITION GROUP                          */
/*                                                                    */
/*           DESC:  this file contains routines to sort and rank      */
/*                  various types of numeric arrays in INCREASING     */
/*                  of DECREASING order                               */
/*                                                                    */
/**********************************************************************/
#include "sctk.h"


/**********************************************************************/
/* qsort short comparison functions  */
int qsort_short_cmp(const void *p, const void *p1);

int qsort_short_deccmp(const void *p, const void *p1);

static short *short_cmp_arr;
int qsort_short_cmp(const void *p, const void *p1){
    return(short_cmp_arr[*((int *)p)] - short_cmp_arr[*((int *)p1)]);
}
int qsort_short_deccmp(const void *p, const void *p1){
    return(short_cmp_arr[*((int *)p1)] - short_cmp_arr[*((int *)p)]);
}

/**********************************************************************/
/* qsort int comparison functions  */
int qsort_int_cmp(const void *p, const void *p1);
int qsort_int_deccmp(const void *p, const void *p1);

static int *int_cmp_arr;
int qsort_int_cmp(const void *p, const void *p1){
    return(int_cmp_arr[*((int *)p)] - int_cmp_arr[*((int *)p1)]);
}
int qsort_int_deccmp(const void *p, const void *p1){
    return(int_cmp_arr[*((int *)p1)] - int_cmp_arr[*((int *)p)]);
}
int qsort_int_compare(const void *i, const void *j) {
    return(*((int *)i) - *((int *)j)); 
}
 



/**********************************************************************/
/* qsort double comparison functions  */
int qsort_double_cmp(const void *p, const void *p1);
int qsort_double_deccmp(const void *p, const void *p1);

static double *double_cmp_arr;
int qsort_double_cmp(const void *p, const void *p1){
    double f = double_cmp_arr[*((int *)p)] - double_cmp_arr[*((int *)p1)];
    return((f < 0.0) ? -1 : ((f > 0) ? 1 : 0));
}
int qsort_double_deccmp(const void *p, const void *p1){
    double f = double_cmp_arr[*((int *)p1)] - double_cmp_arr[*((int *)p)];
    return((f < 0.0) ? -1 : ((f > 0) ? 1 : 0));
}
int qsort_double_compare(const void *i, const void *j) {
    double f = *((double *)i) - *((double *)j);
    return((f < 0.0) ? -1 : ((f > 0) ? 1 : 0));
}

/**********************************************************************/
/*   Sort a short array                                               */
/*        arr -> the short array                                      */
/*        ptr_arr -> an integer array of indexes into arr.            */
/*                   using this array to index arr, sorts the arr     */
/**********************************************************************/
void sort_short_arr(short int *arr, int num, int *ptr_arr, int order)
{
    int j;
    /* init the indexes to 1-n */ 
    for (j=0;j<num;j++)
        ptr_arr[j] = j;

    short_cmp_arr = arr;
    if (order == INCREASING)
	qsort((void *)ptr_arr,num,sizeof(int),qsort_short_cmp);
    else
	qsort((void *)ptr_arr,num,sizeof(int),qsort_short_deccmp);
}


/**********************************************************************/
/*   Sort a double array                                               */
/*        arr -> the double array                                      */
/*        ptr_arr -> an integer array of indexes into arr.            */
/*                   using this array to index arr, sorts the arr     */
/**********************************************************************/
void sort_double_arr(double *arr, int num, int *ptr_arr, int order)
{
    int j;
    /* init the indexes to 1-n */ 
    for (j=0;j<num;j++)
        ptr_arr[j] = j;

    double_cmp_arr = arr;
    if (order == INCREASING)
	qsort((void *)ptr_arr,num,sizeof(int),qsort_double_cmp);
    else
	qsort((void *)ptr_arr,num,sizeof(int),qsort_double_deccmp);
}

/**********************************************************************/
/*   Sort a int array                                                 */
/*        arr -> the int array                                        */
/*        ptr_arr -> an integer array of indexes into arr.            */
/*                   using this array to index arr, sorts the arr     */
/**********************************************************************/
void sort_int_arr(int *arr, int num, int *ptr_arr, int order)
{
    int j;
    /* init the indexes to 1-n */ 
    for (j=0;j<num;j++)
        ptr_arr[j] = j;

    int_cmp_arr = arr;
    if (order == INCREASING)
	qsort((void *)ptr_arr,num,sizeof(int),qsort_int_cmp);
    else
	qsort((void *)ptr_arr,num,sizeof(int),qsort_int_deccmp);
}

/**********************************************************************/
/*   Sort an array strings. to access the results, a double           */
/*   indirection is needed.                                           */
/*        arr -> the 2 dimarr of chars                                */
/**********************************************************************/
void sort_strings_using_index(char **arr, int *ind, int num, int order)
{
    int i, j, tmp;

    for (i=0;i<num;i++)
	ind[i] = i;

    if (order == DECREASING){
        for (j=num;j>0;j--){
            for (i=0;i<j-1;i++)
		if (strcmp(arr[ind[i]],arr[ind[i+1]]) < 0){
                    tmp = ind[i];
                    ind[i] = ind[i+1];
                    ind[i+1] = tmp;
	        }
	}
    }
    else{
        for (j=num;j>0;j--)
            for (i=0;i<j-1;i++)
                if (strcmp(arr[ind[i]],arr[ind[i+1]]) > 0){
                    tmp = ind[i];
                    ind[i] = ind[i+1];
                    ind[i+1] = tmp;
	        }
    }
/*    printf("sort debug\n");
    for (i=0;i<num;i++)
	printf("  %d arr[%d]-> %s \n",i,ind[i],arr[ind[i]]);*/

}

/**********************************************************************/
/*   Sort an array strings in place                                   */
/*        arr -> the 2 dimarr of chars                                */
/**********************************************************************/
void sort_strings_in_place(char **arr, int num, int order)
{
    int i, j;
    char *tmp;

    if (order == DECREASING){
        for (j=num;j>0;j--){
            for (i=0;i<j-1;i++)
                if (strcmp(arr[i],arr[i+1]) < 0){
                    tmp = arr[i];
                    arr[i] = arr[i+1];
                    arr[i+1] = tmp;
	        }
	}
    }
    else{
        for (j=num;j>0;j--)
            for (i=0;i<j-1;i++)
                if (strcmp(arr[i],arr[i+1]) > 0){
                    tmp = arr[i];
                    arr[i] = arr[i+1];
                    arr[i+1] = tmp;
	        }
    }
/*            for (i=0;i<num;i++)
                printf("%s ",arr[i]);
            printf("\n");*/
}

/**********************************************************************/
/*   Sort and rank an integer array                                   */
/*        arr -> the integer array                                    */
/*        ptr_arr -> an integer array of indexes into arr.            */
/*                   using this array to index arr, sorts the arr     */
/*        rank_arr -> an array of mean ranks of the elements in arr   */
/**********************************************************************/
void rank_int_arr(int *arr, int num, int *ptr_arr, double *rank_arr, int order)
{
    int i, j, tmp, count;


    sort_int_arr(arr, num, ptr_arr, order);

    /* mean rank the short arr                                 */
    /*    . . . the average of the ranks for duplicate numbers */
    for (j=0;j<num;j++){
        /*  if the next number is = the the current number */
        if ((j<num-1) && (arr[ptr_arr[j]] == arr[ptr_arr[j+1]])){
            /* find the last duplicate number */
            count = j;
            while((count < num-1) &&
                  (arr[ptr_arr[count]] == arr[ptr_arr[count+1]])){
                count++;
	    }
            /* count the number of duplicates */
            tmp = 0;
            for (i=j;i<count+1;i++)
                tmp+=i;
            /* install the averages in all duplicates */
            for (i=j;i<count+1;i++)
                rank_arr[ptr_arr[i]] = (double)tmp/(double)(count+1-j) + 1.0;
            /* go the the end of the duplicates */
            j=i-1;
	}
        else{
            /* no duplicates, use the index as the rank */
            rank_arr[ptr_arr[j]] = (double)(j+1);
	}
    }
}

/**********************************************************************/
/*   Sort and rank an double array                                     */
/*        arr -> the double array                                      */
/*        ptr_arr -> an integer array of indexes into arr.            */
/*                   using this array to index arr, sorts the arr     */
/*        rank_arr -> an array of mean ranks of the elements in arr   */
/*                                                                    */
/*  *** for comments, look up at sort_int_arr                         */
/*                                                                    */
/**********************************************************************/
void rank_double_arr(double *arr, int num, int *ptr_arr, double *rank_arr, int order)
{
    int i, j, tmp, count;

    sort_double_arr(arr, num, ptr_arr, order);

    for (j=0;j<num;j++){
        if ((j<num-1) && (arr[ptr_arr[j]] == arr[ptr_arr[j+1]])){
            count = j;
            while((count < num-1) &&
                  (arr[ptr_arr[count]] == arr[ptr_arr[count+1]])){
                count++;
	    }
            tmp = 0;
            for (i=j;i<count+1;i++)
                tmp+=i;
            for (i=j;i<count+1;i++)
                rank_arr[ptr_arr[i]] = (double)tmp/(double)(count+1-j) + 1.0;
            j=i-1;
	}
        else{
            rank_arr[ptr_arr[j]] = (double)(j+1);
	}
    }
}