liblept/numafunc1.c - platform/external/tesseract - Git at Google

 /*====================================================================*
  -  Copyright (C) 2001 Leptonica.  All rights reserved.
  -  This software is distributed in the hope that it will be
  -  useful, but with NO WARRANTY OF ANY KIND.
  -  No author or distributor accepts responsibility to anyone for the
  -  consequences of using this software, or for whether it serves any
  -  particular purpose or works at all, unless he or she says so in
  -  writing.  Everyone is granted permission to copy, modify and
  -  redistribute this source code, for commercial or non-commercial
  -  purposes, with the following restrictions: (1) the origin of this
  -  source code must not be misrepresented; (2) modified versions must
  -  be plainly marked as such; and (3) this notice may not be removed
  -  or altered from any source or modified source distribution.
  *====================================================================*/

 /*
  *   numafunc1.c
  *
  *      Arithmetic and logic
  *          NUMA        *numaArithOp()
  *          NUMA        *numaLogicalOp()
  *          NUMA        *numaInvert()
  *
  *      Simple extractions
  *          l_int32      numaGetMin()
  *          l_int32      numaGetMax()
  *          l_int32      numaGetSum()
  *          NUMA        *numaGetPartialSums()
  *          l_int32      numaGetSumOnInterval()
  *          l_int32      numaHasOnlyIntegers()
  *          NUMA        *numaSubsample()
  *          NUMA        *numaMakeSequence()
  *          NUMA        *numaMakeConstant()
  *          l_int32      numaGetNonzeroRange()
  *          l_int32      numaGetCountRelativeToZero()
  *          NUMA        *numaClipToInterval()
  *          NUMA        *numaMakeThresholdIndicator()
  *
  *      Interpolation
  *          l_int32      numaInterpolateEqxVal()
  *          l_int32      numaInterpolateEqxInterval()
  *          l_int32      numaInterpolateArbxVal()
  *          l_int32      numaInterpolateArbxInterval()
  *
  *      Functions requiring interpolation
  *          l_int32      numaFitMax()
  *          l_int32      numaDifferentiateInterval()
  *          l_int32      numaIntegrateInterval()
  *
  *      Sorting
  *          NUMA        *numaSort()
  *          NUMA        *numaGetSortIndex()
  *          NUMA        *numaSortByIndex()
  *          l_int32      numaIsSorted()
  *          l_int32      numaSortPair()
  *          NUMA        *numaPseudorandomSequence()
  *
  *      Functions requiring sorting
  *          l_int32      numaGetMedian()
  *          l_int32      numaGetMode()
  *
  *      Numa combination
  *          l_int32      numaJoin()
  *          NUMA        *numaaFlattenToNuma()
  *
  *
  *    Things to remember when using the Numa:
  *
  *    (1) The numa is a struct, not an array.  Always use accessors
  *        (see numabasic.c), never the fields directly.
  *
  *    (2) The number array holds l_float32 values.  It can also
  *        be used to store l_int32 values.  See numabasic.c for
  *        details on using the accessors.
  *
  *    (3) If you use numaCreate(), no numbers are stored and the size is 0.
  *        You have to add numbers to increase the size.
  *        If you want to start with a numa of a fixed size, with each
  *        entry initialized to the same value, use numaMakeConstant().
  *
  *    (4) Occasionally, in the comments we denote the i-th element of a
  *        numa by na[i].  This is conceptual only -- the numa is not an array!
  */

 #include <stdio.h>
 #include <string.h>
 #include <stdlib.h>
 #include <math.h>
 #include "allheaders.h"


 /*----------------------------------------------------------------------*
  *                Arithmetic and logical ops on Numas                   *
  *----------------------------------------------------------------------*/
 /*!
  *  numaArithOp()
  *
  *      Input:  nad (<optional> can be null or equal to na1 (in-place)
  *              na1
  *              na2
  *              op (L_ARITH_ADD, L_ARITH_SUBTRACT,
  *                  L_ARITH_MULTIPLY, L_ARITH_DIVIDE)
  *      Return: nad (always: operation applied to na1 and na2)
  *
  *  Notes:
  *      (1) The sizes of na1 and na2 must be equal.
  *      (2) nad can only null or equal to na1.
  *      (3) To add a constant to a numa, or to multipy a numa by
  *          a constant, use numaTransform().
  */
 NUMA *
 numaArithOp(NUMA    *nad,
             NUMA    *na1,
             NUMA    *na2,
             l_int32  op)
 {
 l_int32    i, n;
 l_float32  val1, val2;

     PROCNAME("numaArithOp");

     if (!na1 || !na2)
         return (NUMA *)ERROR_PTR("na1, na2 not both defined", procName, nad);
     n = numaGetCount(na1);
     if (n != numaGetCount(na2))
         return (NUMA *)ERROR_PTR("na1, na2 sizes differ", procName, nad);
     if (nad && nad != na1)
         return (NUMA *)ERROR_PTR("nad defined but not in-place", procName, nad);
     if (op != L_ARITH_ADD && op != L_ARITH_SUBTRACT &&
         op != L_ARITH_MULTIPLY && op != L_ARITH_DIVIDE)
         return (NUMA *)ERROR_PTR("invalid op", procName, nad);
     if (op == L_ARITH_DIVIDE) {
         for (i = 0; i < n; i++) {
             numaGetFValue(na2, i, &val2);
             if (val2 == 0.0)
                 return (NUMA *)ERROR_PTR("na2 has 0 element", procName, nad);
         }
     }

         /* If nad is not identical to na1, make it an identical copy */
     if (!nad)
         nad = numaCopy(na1);

     for (i = 0; i < n; i++) {
         numaGetFValue(nad, i, &val1);
         numaGetFValue(na2, i, &val2);
         switch (op) {
         case L_ARITH_ADD:
             numaSetValue(nad, i, val1 + val2);
             break;
         case L_ARITH_SUBTRACT:
             numaSetValue(nad, i, val1 - val2);
             break;
         case L_ARITH_MULTIPLY:
             numaSetValue(nad, i, val1 * val2);
             break;
         case L_ARITH_DIVIDE:
             numaSetValue(nad, i, val1 / val2);
             break;
         default:
             fprintf(stderr, " Unknown arith op: %d\n", op);
             return nad;
         }
     }

     return nad;
 }


 /*!
  *  numaLogicalOp()
  *
  *      Input:  nad (<optional> can be null or equal to na1 (in-place)
  *              na1
  *              na2
  *              op (L_UNION, L_INTERSECTION, L_SUBTRACTION, L_EXCLUSIVE_OR)
  *      Return: nad (always: operation applied to na1 and na2)
  *
  *  Notes:
  *      (1) The sizes of na1 and na2 must be equal.
  *      (2) nad can only null or equal to na1.
  *      (3) This is intended for use with indicator arrays (0s and 1s).
  *          Input data is extracted as integers (0 == false, anything
  *          else == true); output results are 0 and 1.
  *      (4) L_SUBTRACTION is subtraction of val2 from val1.  For bit logical
  *          arithmetic this is (val1 & ~val2), but because these values
  *          are integers, we use (val1 && !val2).
  */
 NUMA *
 numaLogicalOp(NUMA    *nad,
               NUMA    *na1,
               NUMA    *na2,
               l_int32  op)
 {
 l_int32  i, n, val1, val2, val;

     PROCNAME("numaLogicalOp");

     if (!na1 || !na2)
         return (NUMA *)ERROR_PTR("na1, na2 not both defined", procName, nad);
     n = numaGetCount(na1);
     if (n != numaGetCount(na2))
         return (NUMA *)ERROR_PTR("na1, na2 sizes differ", procName, nad);
     if (nad && nad != na1)
         return (NUMA *)ERROR_PTR("nad defined; not in-place", procName, nad);
     if (op != L_UNION && op != L_INTERSECTION &&
         op != L_SUBTRACTION && op != L_EXCLUSIVE_OR)
         return (NUMA *)ERROR_PTR("invalid op", procName, nad);

         /* If nad is not identical to na1, make it an identical copy */
     if (!nad)
         nad = numaCopy(na1);

     for (i = 0; i < n; i++) {
         numaGetIValue(nad, i, &val1);
         numaGetIValue(na2, i, &val2);
         switch (op) {
         case L_UNION:
             val = (val1 || val2) ? 1 : 0;
             numaSetValue(nad, i, val);
             break;
         case L_INTERSECTION:
             val = (val1 && val2) ? 1 : 0;
             numaSetValue(nad, i, val);
             break;
         case L_SUBTRACTION:
             val = (val1 && !val2) ? 1 : 0;
             numaSetValue(nad, i, val);
             break;
         case L_EXCLUSIVE_OR:
             val = ((val1 && !val2) || (!val1 && val2)) ? 1 : 0;
             numaSetValue(nad, i, val);
             break;
         default:
             fprintf(stderr, " Unknown logical op: %d\n", op);
             return nad;
         }
     }

     return nad;
 }


 /*!
  *  numaInvert()
  *
  *      Input:  nad (<optional> can be null or equal to nas (in-place)
  *              nas
  *      Return: nad (always: 'inverts' nas)
  *
  *  Notes:
  *      (1) This is intended for use with indicator arrays (0s and 1s).
  *          It gives a boolean-type output, taking the input as
  *          an integer and inverting it:
  *              0              -->  1
  *              anything else  -->   0
  */
 NUMA *
 numaInvert(NUMA  *nad,
            NUMA  *nas)
 {
 l_int32  i, n, val;

     PROCNAME("numaInvert");

     if (!nas)
         return (NUMA *)ERROR_PTR("nas not defined", procName, nad);
     if (nad && nad != nas)
         return (NUMA *)ERROR_PTR("nad defined; not in-place", procName, nad);

     if (!nad)
         nad = numaCopy(nas);
     n = numaGetCount(nad);
     for (i = 0; i < n; i++) {
         numaGetIValue(nad, i, &val);
         if (!val)
             val = 1;
         else
             val = 0;
         numaSetValue(nad, i, val);
     }

     return nad;
 }


 /*----------------------------------------------------------------------*
  *                         Simple extractions                           *
  *----------------------------------------------------------------------*/
 /*!
  *  numaGetMin()
  *
  *      Input:  na
  *              &minval (<optional return> min value)
  *              &iminloc (<optional return> index of min location)
  *      Return: 0 if OK; 1 on error
  */
 l_int32
 numaGetMin(NUMA       *na,
            l_float32  *pminval,
            l_int32    *piminloc)
 {
 l_int32    i, n, iminloc;
 l_float32  val, minval;

     PROCNAME("numaGetMin");

     if (!pminval && !piminloc)
         return ERROR_INT("nothing to do", procName, 1);
     if (pminval) *pminval = 0.0;
     if (piminloc) *piminloc = 0;
     if (!na)
         return ERROR_INT("na not defined", procName, 1);

     minval = +1000000000.;
     iminloc = 0;
     n = numaGetCount(na);
     for (i = 0; i < n; i++) {
         numaGetFValue(na, i, &val);
         if (val < minval) {
             minval = val;
             iminloc = i;
         }
     }

     if (pminval) *pminval = minval;
     if (piminloc) *piminloc = iminloc;
     return 0;
 }


 /*!
  *  numaGetMax()
  *
  *      Input:  na
  *              &maxval (<optional return> max value)
  *              &imaxloc (<optional return> index of max location)
  *      Return: 0 if OK; 1 on error
  */
 l_int32
 numaGetMax(NUMA       *na,
            l_float32  *pmaxval,
            l_int32    *pimaxloc)
 {
 l_int32    i, n, imaxloc;
 l_float32  val, maxval;

     PROCNAME("numaGetMax");

     if (!pmaxval && !pimaxloc)
         return ERROR_INT("nothing to do", procName, 1);
     if (pmaxval) *pmaxval = 0.0;
     if (pimaxloc) *pimaxloc = 0;
     if (!na)
         return ERROR_INT("na not defined", procName, 1);

     maxval = -1000000000.;
     imaxloc = 0;
     n = numaGetCount(na);
     for (i = 0; i < n; i++) {
         numaGetFValue(na, i, &val);
         if (val > maxval) {
             maxval = val;
             imaxloc = i;
         }
     }

     if (pmaxval) *pmaxval = maxval;
     if (pimaxloc) *pimaxloc = imaxloc;
     return 0;
 }


 /*!
  *  numaGetSum()
  *
  *      Input:  na
  *              &sum (<return> sum of values)
  *      Return: 0 if OK, 1 on error
  */
 l_int32
 numaGetSum(NUMA       *na,
            l_float32  *psum)
 {
 l_int32    i, n;
 l_float32  val, sum;

     PROCNAME("numaGetSum");

     if (!na)
         return ERROR_INT("na not defined", procName, 1);
     if (!psum)
         return ERROR_INT("&sum not defined", procName, 1);

     sum = 0.0;
     n = numaGetCount(na);
     for (i = 0; i < n; i++) {
         numaGetFValue(na, i, &val);
         sum += val;
     }
     *psum = sum;
     return 0;
 }


 /*!
  *  numaGetPartialSums()
  *
  *      Input:  na
  *      Return: nasum, or null on error
  *
  *  Notes:
  *      (1) nasum[i] is the sum for all j <= i of na[j].
  *          So nasum[0] = na[0].
  *      (2) If you want to generate a rank function, where rank[0] - 0.0,
  *          insert a 0.0 at the beginning of the nasum array.
  */
 NUMA *
 numaGetPartialSums(NUMA  *na)
 {
 l_int32    i, n;
 l_float32  val, sum;
 NUMA      *nasum;

     PROCNAME("numaGetPartialSums");

     if (!na)
         return (NUMA *)ERROR_PTR("na not defined", procName, NULL);

     n = numaGetCount(na);
     nasum = numaCreate(n);
     sum = 0.0;
     for (i = 0; i < n; i++) {
         numaGetFValue(na, i, &val);
         sum += val;
         numaAddNumber(nasum, sum);
     }
     return nasum;
 }


 /*!
  *  numaGetSumOnInterval()
  *
  *      Input:  na
  *              first (beginning index)
  *              last (final index)
  *              &sum (<return> sum of values in the index interval range)
  *      Return: 0 if OK, 1 on error
  */
 l_int32
 numaGetSumOnInterval(NUMA       *na,
                      l_int32     first,
                      l_int32     last,
                      l_float32  *psum)
 {
 l_int32    i, n, truelast;
 l_float32  val, sum;

     PROCNAME("numaGetSumOnInterval");

     if (!na)
         return ERROR_INT("na not defined", procName, 1);
     if (!psum)
         return ERROR_INT("&sum not defined", procName, 1);
     *psum = 0.0;

     sum = 0.0;
     n = numaGetCount(na);
     if (first >= n)  /* not an error */
       return 0;
     truelast = L_MIN(last, n - 1);

     for (i = first; i <= truelast; i++) {
         numaGetFValue(na, i, &val);
         sum += val;
     }
     *psum = sum;
     return 0;
 }


 /*!
  *  numaHasOnlyIntegers()
  *
  *      Input:  na
  *              maxsamples (maximum number of samples to check)
  *              &allints (<return> 1 if all sampled values are ints; else 0)
  *      Return: 0 if OK, 1 on error
  *
  *  Notes:
  *      (1) Set @maxsamples == 0 to check every integer in na.  Otherwise,
  *          this samples no more than @maxsamples.
  */
 l_int32
 numaHasOnlyIntegers(NUMA     *na,
                     l_int32   maxsamples,
                     l_int32  *pallints)
 {
 l_int32    i, n, incr;
 l_float32  val;

     PROCNAME("numaHasOnlyIntegers");

     if (!pallints)
         return ERROR_INT("&allints not defined", procName, 1);
     *pallints = TRUE;
     if (!na)
         return ERROR_INT("na not defined", procName, 1);

     if ((n = numaGetCount(na)) == 0)
         return ERROR_INT("na empty", procName, 1);
     if (maxsamples <= 0)
         incr = 1;
     else
         incr = (l_int32)((n + maxsamples - 1) / maxsamples);
     for (i = 0; i < n; i += incr) {
         numaGetFValue(na, i, &val);
         if (val != (l_int32)val) {
             *pallints = FALSE;
             return 0;
         }
     }

     return 0;
 }


 /*!
  *  numaSubsample()
  *
  *      Input:  nas
  *              subfactor (subsample factor, >= 1)
  *      Return: nad (evenly sampled values from nas), or null on error
  */
 NUMA *
 numaSubsample(NUMA    *nas,
               l_int32  subfactor)
 {
 l_int32    i, n;
 l_float32  val;
 NUMA      *nad;

     PROCNAME("numaSubsample");

     if (!nas)
         return (NUMA *)ERROR_PTR("nas not defined", procName, NULL);
     if (subfactor < 1)
         return (NUMA *)ERROR_PTR("subfactor < 1", procName, NULL);

     nad = numaCreate(0);
     n = numaGetCount(nas);
     for (i = 0; i < n; i++) {
         if (i % subfactor != 0) continue;
         numaGetFValue(nas, i, &val);
         numaAddNumber(nad, val);
     }

     return nad;
 }


 /*!
  *  numaMakeSequence()
  *
  *      Input:  startval
  *              increment
  *              size (of sequence)
  *      Return: numa of sequence of evenly spaced values, or null on error
  */
 NUMA *
 numaMakeSequence(l_float32  startval,
                  l_float32  increment,
                  l_int32    size)
 {
 l_int32    i;
 l_float32  val;
 NUMA      *na;

     PROCNAME("numaMakeSequence");

     if ((na = numaCreate(size)) == NULL)
         return (NUMA *)ERROR_PTR("na not made", procName, NULL);

     for (i = 0; i < size; i++) {
         val = startval + i * increment;
         numaAddNumber(na, val);
     }

     return na;
 }


 /*!
  *  numaMakeConstant()
  *
  *      Input:  val
  *              size (of numa)
  *      Return: numa of given size with all entries equal to 'val',
  *              or null on error
  */
 NUMA *
 numaMakeConstant(l_float32  val,
                  l_int32    size)
 {
     return numaMakeSequence(val, 0.0, size);
 }


 /*!
  *  numaGetNonzeroRange()
  *
  *      Input:  numa
  *              eps (largest value considered to be zero)
  *              &first, &last (<return> interval of array indices
  *                             where values are nonzero)
  *      Return: 0 if OK, 1 on error or if no nonzero range is found.
  */
 l_int32
 numaGetNonzeroRange(NUMA      *na,
                     l_float32  eps,
                     l_int32   *pfirst,
                     l_int32   *plast)
 {
 l_int32    n, i, found;
 l_float32  val;

     PROCNAME("numaGetNonzeroRange");

     if (!na)
         return ERROR_INT("na not defined", procName, 1);
     if (!pfirst || !plast)
         return ERROR_INT("pfirst and plast not both defined", procName, 1);
     n = numaGetCount(na);
     found = FALSE;
     for (i = 0; i < n; i++) {
         numaGetFValue(na, i, &val);
         if (val > eps) {
             found = TRUE;
             break;
         }
     }
     if (!found) {
         *pfirst = n - 1;
         *plast = 0;
         return 1;
     }

     *pfirst = i;
     for (i = n - 1; i >= 0; i--) {
         numaGetFValue(na, i, &val);
         if (val > eps)
             break;
     }
     *plast = i;
     return 0;
 }


 /*!
  *  numaGetCountRelativeToZero()
  *
  *      Input:  numa
  *              type (L_LESS_THAN_ZERO, L_EQUAL_TO_ZERO, L_GREATER_THAN_ZERO)
  *              &count (<return> count of values of given type)
  *      Return: 0 if OK, 1 on error
  */
 l_int32
 numaGetCountRelativeToZero(NUMA     *na,
                            l_int32   type,
                            l_int32  *pcount)
 {
 l_int32    n, i, count;
 l_float32  val;

     PROCNAME("numaGetCountRelativeToZero");

     if (!pcount)
         return ERROR_INT("&count not defined", procName, 1);
     *pcount = 0;
     if (!na)
         return ERROR_INT("na not defined", procName, 1);
     n = numaGetCount(na);
     for (i = 0, count = 0; i < n; i++) {
         numaGetFValue(na, i, &val);
         if (type == L_LESS_THAN_ZERO && val < 0.0)
             count++;
         else if (type == L_EQUAL_TO_ZERO && val == 0.0)
             count++;
         else if (type == L_GREATER_THAN_ZERO && val > 0.0)
             count++;
     }

     *pcount = count;
     return 0;
 }


 /*!
  *  numaClipToInterval()
  *
  *      Input:  numa
  *              first, last (clipping interval)
  *      Return: numa with the same values as the input, but clipped
  *              to the specified interval
  *
  *  Note: If you want the indices of the array values to be unchanged,
  *        use first = 0.
  *  Usage: This is useful to clip a histogram that has a few nonzero
  *         values to its nonzero range.
  */
 NUMA *
 numaClipToInterval(NUMA    *nas,
                    l_int32  first,
                    l_int32  last)
 {
 l_int32    n, i, truelast;
 l_float32  val;
 NUMA      *nad;

     PROCNAME("numaClipToInterval");

     if (!nas)
         return (NUMA *)ERROR_PTR("nas not defined", procName, NULL);
     if (first > last)
         return (NUMA *)ERROR_PTR("range not valid", procName, NULL);

     n = numaGetCount(nas);
     if (first >= n)
         return (NUMA *)ERROR_PTR("no elements in range", procName, NULL);
     truelast = L_MIN(last, n - 1);
     if ((nad = numaCreate(truelast - first + 1)) == NULL)
         return (NUMA *)ERROR_PTR("nad not made", procName, NULL);
     for (i = first; i <= truelast; i++) {
         numaGetFValue(nas, i, &val);
         numaAddNumber(nad, val);
     }

     return nad;
 }


 /*!
  *  numaMakeThresholdIndicator()
  *
  *      Input:  nas (input numa)
  *              thresh (threshold value)
  *              type (L_SELECT_IF_LT, L_SELECT_IF_GT,
  *                    L_SELECT_IF_LTE, L_SELECT_IF_GTE)
  *      Output: nad (indicator array: values are 0 and 1)
  *
  *  Notes:
  *      (1) For each element in nas, if the constraint given by 'type'
  *          correctly specifies its relation to thresh, a value of 1
  *          is recorded in nad.
  */
 NUMA *
 numaMakeThresholdIndicator(NUMA      *nas,
                            l_float32  thresh,
                            l_int32    type)
 {
 l_int32    n, i, ival;
 l_float32  fval;
 NUMA      *nai;

     PROCNAME("numaMakeThresholdIndicator");

     n = numaGetCount(nas);
     nai = numaCreate(n);
     for (i = 0; i < n; i++) {
         numaGetFValue(nas, i, &fval);
         ival = 0;
         switch (type)
         {
         case L_SELECT_IF_LT:
             if (fval < thresh) ival = 1;
             break;
         case L_SELECT_IF_GT:
             if (fval > thresh) ival = 1;
             break;
         case L_SELECT_IF_LTE:
             if (fval <= thresh) ival = 1;
             break;
         case L_SELECT_IF_GTE:
             if (fval >= thresh) ival = 1;
             break;
         default:
             numaDestroy(&nai);
             return (NUMA *)ERROR_PTR("invalid type", procName, NULL);
         }
         numaAddNumber(nai, ival);
     }

     return nai;
 }


 /*----------------------------------------------------------------------*
  *                             Interpolation                            *
  *----------------------------------------------------------------------*/
 /*!
  *  numaInterpolateEqxVal()
  *
  *      Input:  startx (xval corresponding to first element in array)
  *              deltax (x increment between array elements)
  *              nay  (numa of ordinate values, assumed equally spaced)
  *              type (L_LINEAR_INTERP, L_QUADRATIC_INTERP)
  *              xval
  *              &yval (<return> interpolated value)
  *      Return: 0 if OK, 1 on error (e.g., if xval is outside range)
  *
  *  Notes:
  *      (1) Considering nay as a function of x, the x values
  *          are equally spaced
  *      (2) Caller should check for valid return.
  *
  *  For linear Lagrangian interpolation (through 2 data pts):
  *         y(x) = y1(x-x2)/(x1-x2) + y2(x-x1)/(x2-x1)
  *
  *  For quadratic Lagrangian interpolation (through 3 data pts):
  *         y(x) = y1(x-x2)(x-x3)/((x1-x2)(x1-x3)) +
  *                y2(x-x1)(x-x3)/((x2-x1)(x2-x3)) +
  *                y3(x-x1)(x-x2)/((x3-x1)(x3-x2))
  *
  */
 l_int32
 numaInterpolateEqxVal(l_float32   startx,
                       l_float32   deltax,
 		      NUMA       *nay,
                       l_int32     type,
                       l_float32   xval,
                       l_float32  *pyval)
 {
 l_int32     i, n, i1, i2, i3;
 l_float32   x1, x2, x3, fy1, fy2, fy3, d1, d2, d3, del, fi, maxx;
 l_float32  *fa;

     PROCNAME("numaInterpolateEqxVal");

     if (!pyval)
         return ERROR_INT("&yval not defined", procName, 1);
     *pyval = 0.0;
     if (!nay)
         return ERROR_INT("nay not defined", procName, 1);
     if (deltax <= 0.0)
         return ERROR_INT("deltax not > 0", procName, 1);
     if (type != L_LINEAR_INTERP && type != L_QUADRATIC_INTERP)
         return ERROR_INT("invalid interp type", procName, 1);
     n = numaGetCount(nay);
     if (n < 2)
         return ERROR_INT("not enough points", procName, 1);
     if (type == L_QUADRATIC_INTERP && n == 2) {
         type = L_LINEAR_INTERP;
         L_WARNING("only 2 points; using linear interp", procName);
     }
     maxx = startx + deltax * (n - 1);
     if (xval < startx || xval > maxx)
         return ERROR_INT("xval is out of bounds", procName, 1);

     fa = numaGetFArray(nay, L_NOCOPY);
     fi = (xval - startx) / deltax;
     i = (l_int32)fi;
     del = fi - i;
     if (del == 0.0) {  /* no interpolation required */
         *pyval = fa[i];
 	return 0;
     }

     if (type == L_LINEAR_INTERP) {
         *pyval = fa[i] + del * (fa[i + 1] - fa[i]);
 	return 0;
     }

         /* Quadratic interpolation */
     d1 = d3 = 0.5 / (deltax * deltax);
     d2 = -2. * d1;
     if (i == 0) {
         i1 = i;
 	i2 = i + 1;
 	i3 = i + 2;
     }
     else {
         i1 = i - 1;
 	i2 = i;
 	i3 = i + 1;
     }
     x1 = startx + i1 * deltax;
     x2 = startx + i2 * deltax;
     x3 = startx + i3 * deltax;
     fy1 = d1 * fa[i1];
     fy2 = d2 * fa[i2];
     fy3 = d3 * fa[i3];
     *pyval = fy1 * (xval - x2) * (xval - x3) +
              fy2 * (xval - x1) * (xval - x3) +
              fy3 * (xval - x1) * (xval - x2);
     return 0;
 }


 /*!
  *  numaInterpolateArbxVal()
  *
  *      Input:  nax (numa of abscissa values)
  *              nay (numa of ordinate values, corresponding to nax)
  *              type (L_LINEAR_INTERP, L_QUADRATIC_INTERP)
  *              xval
  *              &yval (<return> interpolated value)
  *      Return: 0 if OK, 1 on error (e.g., if xval is outside range)
  *
  *  Notes:
  *      (1) The values in nax must be sorted in increasing order.
  *          If, additionally, they are equally spaced, you can use
  *          numaInterpolateEqxVal().
  *      (2) Caller should check for valid return.
  *      (3) Uses lagrangian interpolation.  See numaInterpolateEqxVal()
  *          for formulas.
  */
 l_int32
 numaInterpolateArbxVal(NUMA       *nax,
                        NUMA       *nay,
                        l_int32     type,
                        l_float32   xval,
                        l_float32  *pyval)
 {
 l_int32     i, im, nx, ny, i1, i2, i3;
 l_float32   delu, dell, fract, d1, d2, d3;
 l_float32   minx, maxx;
 l_float32  *fax, *fay;

     PROCNAME("numaInterpolateArbxVal");

     if (!pyval)
         return ERROR_INT("&yval not defined", procName, 1);
     *pyval = 0.0;
     if (!nax)
         return ERROR_INT("nax not defined", procName, 1);
     if (!nay)
         return ERROR_INT("nay not defined", procName, 1);
     if (type != L_LINEAR_INTERP && type != L_QUADRATIC_INTERP)
         return ERROR_INT("invalid interp type", procName, 1);
     ny = numaGetCount(nay);
     nx = numaGetCount(nax);
     if (nx != ny)
         return ERROR_INT("nax and nay not same size arrays", procName, 1);
     if (ny < 2)
         return ERROR_INT("not enough points", procName, 1);
     if (type == L_QUADRATIC_INTERP && ny == 2) {
         type = L_LINEAR_INTERP;
         L_WARNING("only 2 points; using linear interp", procName);
     }
     numaGetFValue(nax, 0, &minx);
     numaGetFValue(nax, nx - 1, &maxx);
     if (xval < minx || xval > maxx)
         return ERROR_INT("xval is out of bounds", procName, 1);

     fax = numaGetFArray(nax, L_NOCOPY);
     fay = numaGetFArray(nay, L_NOCOPY);

         /* Linear search for interval.  We are guaranteed
          * to either return or break out of the loop.
          * In addition, we are assured that fax[i] - fax[im] > 0.0 */
     if (xval == fax[0]) {
         *pyval = fay[0];
         return 0;
     }
     for (i = 1; i < nx; i++) {
         delu = fax[i] - xval;
 	if (delu >= 0.0) {  /* we've passed it */
             if (delu == 0.0) {
                 *pyval = fay[i];
                 return 0;
             }
             im = i - 1;
             dell = xval - fax[im];  /* >= 0 */
             break;
         }
     }
     fract = dell / (fax[i] - fax[im]);

     if (type == L_LINEAR_INTERP) {
         *pyval = fay[i] + fract * (fay[i + 1] - fay[i]);
 	return 0;
     }

         /* Quadratic interpolation */
     if (im == 0) {
         i1 = im;
 	i2 = im + 1;
 	i3 = im + 2;
     }
     else {
         i1 = im - 1;
 	i2 = im;
 	i3 = im + 1;
     }
     d1 = (fax[i1] - fax[i2]) * (fax[i1] - fax[i3]);
     d2 = (fax[i2] - fax[i1]) * (fax[i2] - fax[i3]);
     d3 = (fax[i3] - fax[i1]) * (fax[i3] - fax[i2]);
     *pyval = fay[i1] * (xval - fax[i2]) * (xval - fax[i3]) / d1 +
              fay[i2] * (xval - fax[i1]) * (xval - fax[i3]) / d2 +
              fay[i3] * (xval - fax[i1]) * (xval - fax[i2]) / d3;
     return 0;
 }


 /*!
  *  numaInterpolateEqxInterval()
  *
  *      Input:  startx (xval corresponding to first element in nas)
  *              deltax (x increment between array elements in nas)
  *              nasy  (numa of ordinate values, assumed equally spaced)
  *              type (L_LINEAR_INTERP, L_QUADRATIC_INTERP)
  *              x0 (start value of interval)
  *              x1 (end value of interval)
  *              npts (number of points to evaluate function in interval)
  *              &nax (<optional return> array of x values in interval)
  *              &nay (<return> array of y values in interval)
  *      Return: 0 if OK, 1 on error
  *
  *  Notes:
  *      (1) Considering nasy as a function of x, the x values
  *          are equally spaced.
  *      (2) This creates nay (and optionally nax) of interpolated
  *          values over the specified interval (x0, x1).
  *      (3) If the interval (x0, x1) lies partially outside the array
  *          nasy (as interpreted by startx and deltax), it is an
  *          error and returns 1.
  *      (4) Note that deltax is the intrinsic x-increment for the input
  *          array nasy, whereas delx is the intrinsic x-increment for the
  *          output interpolated array nay.
  */
 l_int32
 numaInterpolateEqxInterval(l_float32  startx,
                            l_float32  deltax,
                            NUMA      *nasy,
                            l_int32    type,
                            l_float32  x0,
                            l_float32  x1,
                            l_int32    npts,
                            NUMA     **pnax,
                            NUMA     **pnay)
 {
 l_int32     i, n;
 l_float32   x, yval, maxx, delx;
 NUMA       *nax, *nay;

     PROCNAME("numaInterpolateEqxInterval");

     if (pnax) *pnax = NULL;
     if (!pnay)
         return ERROR_INT("&nay not defined", procName, 1);
     *pnay = NULL;
     if (!nasy)
         return ERROR_INT("nasy not defined", procName, 1);
     if (deltax <= 0.0)
         return ERROR_INT("deltax not > 0", procName, 1);
     if (type != L_LINEAR_INTERP && type != L_QUADRATIC_INTERP)
         return ERROR_INT("invalid interp type", procName, 1);
     n = numaGetCount(nasy);
     if (type == L_QUADRATIC_INTERP && n == 2) {
         type = L_LINEAR_INTERP;
         L_WARNING("only 2 points; using linear interp", procName);
     }
     maxx = startx + deltax * (n - 1);
     if (x0 < startx || x1 > maxx || x1 <= x0)
         return ERROR_INT("[x0 ... x1] is not valid", procName, 1);
     if (npts < 3)
         return ERROR_INT("npts < 3", procName, 1);
     delx = (x1 - x0) / (l_float32)(npts - 1);  /* delx is for output nay */

     if ((nay = numaCreate(npts)) == NULL)
         return ERROR_INT("nay not made", procName, 1);
     numaSetXParameters(nay, x0, delx);
     *pnay = nay;
     if (pnax) {
         nax = numaCreate(npts);
 	*pnax = nax;
     }

     for (i = 0; i < npts; i++) {
         x = x0 + i * delx;
         if (pnax)
             numaAddNumber(nax, x);
         numaInterpolateEqxVal(startx, deltax, nasy, type, x, &yval);
 	numaAddNumber(nay, yval);
     }

     return 0;
 }


 /*!
  *  numaInterpolateArbxInterval()
  *
  *      Input:  nax (numa of abscissa values)
  *              nay (numa of ordinate values, corresponding to nax)
  *              type (L_LINEAR_INTERP, L_QUADRATIC_INTERP)
  *              x0 (start value of interval)
  *              x1 (end value of interval)
  *              npts (number of points to evaluate function in interval)
  *              &nadx (<optional return> array of x values in interval)
  *              &nady (<return> array of y values in interval)
  *      Return: 0 if OK, 1 on error (e.g., if x0 or x1 is outside range)
  *
  *  Notes:
  *      (1) The values in nax must be sorted in increasing order.
  *          If they are not sorted, we do it here, and complain.
  *      (2) If the values in nax are equally spaced, you can use
  *          numaInterpolateEqxInterval().
  *      (3) Caller should check for valid return.
  *      (4) We don't call numaInterpolateArbxVal() for each output
  *          point, because that requires an O(n) search for
  *          each point.  Instead, we do a single O(n) pass through
  *          nax, saving the indices to be used for each output yval.
  *      (5) Uses lagrangian interpolation.  See numaInterpolateEqxVal()
  *          for formulas.
  */
 l_int32
 numaInterpolateArbxInterval(NUMA       *nax,
                             NUMA       *nay,
                             l_int32     type,
                             l_float32   x0,
                             l_float32   x1,
                             l_int32     npts,
                             NUMA      **pnadx,
                             NUMA      **pnady)
 {
 l_int32     i, im, j, nx, ny, i1, i2, i3, sorted;
 l_int32    *index;
 l_float32   del, xval, yval, excess, fract, minx, maxx, d1, d2, d3;
 l_float32  *fax, *fay;
 NUMA       *nasx, *nasy, *nadx, *nady;

     PROCNAME("numaInterpolateArbxInterval");

     if (pnadx) *pnadx = NULL;
     if (!pnady)
         return ERROR_INT("&nady not defined", procName, 1);
     *pnady = NULL;
     if (!nay)
         return ERROR_INT("nay not defined", procName, 1);
     if (!nax)
         return ERROR_INT("nax not defined", procName, 1);
     if (type != L_LINEAR_INTERP && type != L_QUADRATIC_INTERP)
         return ERROR_INT("invalid interp type", procName, 1);
     if (x0 > x1)
         return ERROR_INT("x0 > x1", procName, 1);
     ny = numaGetCount(nay);
     nx = numaGetCount(nax);
     if (nx != ny)
         return ERROR_INT("nax and nay not same size arrays", procName, 1);
     if (ny < 2)
         return ERROR_INT("not enough points", procName, 1);
     if (type == L_QUADRATIC_INTERP && ny == 2) {
         type = L_LINEAR_INTERP;
         L_WARNING("only 2 points; using linear interp", procName);
     }
     numaGetMin(nax, &minx, NULL);
     numaGetMax(nax, &maxx, NULL);
     if (x0 < minx || x1 > maxx)
         return ERROR_INT("xval is out of bounds", procName, 1);

         /* Make sure that nax is sorted in increasing order */
     numaIsSorted(nax, L_SORT_INCREASING, &sorted);
     if (!sorted) {
         L_WARNING("we are sorting nax in increasing order", procName);
         numaSortPair(nax, nay, L_SORT_INCREASING, &nasx, &nasy);
     }
     else {
         nasx = numaClone(nax);
         nasy = numaClone(nay);
     }

     fax = numaGetFArray(nasx, L_NOCOPY);
     fay = numaGetFArray(nasy, L_NOCOPY);

         /* Get array of indices into fax for interpolated locations */
     if ((index = (l_int32 *)CALLOC(npts, sizeof(l_int32))) == NULL)
         return ERROR_INT("ind not made", procName, 1);
     del = (x1 - x0) / (npts - 1.0);
     for (i = 0, j = 0; j < nx && i < npts; i++) {
         xval = x0 + i * del;
         while (j < nx - 1 && xval > fax[j])
             j++;
         if (xval == fax[j])
             index[i] = L_MIN(j, nx - 1);
         else    /* the index of fax[] is just below xval */
             index[i] = L_MAX(j - 1, 0);
     }

         /* For each point to be interpolated, get the y value */
     nady = numaCreate(npts);
     *pnady = nady;
     if (pnadx) {
         nadx = numaCreate(npts);
 	*pnadx = nadx;
     }
     for (i = 0; i < npts; i++) {
         xval = x0 + i * del;
 	if (pnadx)
             numaAddNumber(nadx, xval);
 	im = index[i];
         excess = xval - fax[im];
 	if (excess == 0.0) {
             numaAddNumber(nady, fay[im]);
             continue;
         }
 	fract = excess / (fax[im + 1] - fax[im]);

         if (type == L_LINEAR_INTERP) {
             yval = fay[im] + fract * (fay[im + 1] - fay[im]);
             numaAddNumber(nady, yval);
 	    continue;
 	}

             /* Quadratic interpolation */
         if (im == 0) {
             i1 = im;
             i2 = im + 1;
             i3 = im + 2;
         }
         else {
             i1 = im - 1;
             i2 = im;
             i3 = im + 1;
         }
         d1 = (fax[i1] - fax[i2]) * (fax[i1] - fax[i3]);
         d2 = (fax[i2] - fax[i1]) * (fax[i2] - fax[i3]);
         d3 = (fax[i3] - fax[i1]) * (fax[i3] - fax[i2]);
         yval = fay[i1] * (xval - fax[i2]) * (xval - fax[i3]) / d1 +
                fay[i2] * (xval - fax[i1]) * (xval - fax[i3]) / d2 +
                fay[i3] * (xval - fax[i1]) * (xval - fax[i2]) / d3;
         numaAddNumber(nady, yval);
     }

     FREE(index);
     numaDestroy(&nasx);
     numaDestroy(&nasy);
     return 0;
 }


 /*----------------------------------------------------------------------*
  *                     Functions requiring interpolation                *
  *----------------------------------------------------------------------*/
 /*!
  *  numaFitMax()
  *
  *      Input:  na  (numa of ordinate values, to fit a max to)
  *              &maxval (<return> max value)
  *              naloc (<optional> associated numa of abscissa values)
  *              &maxloc (<return> abscissa value that gives max value in na;
  *                   if naloc == null, this is given as an interpolated
  *                   index value)
  *      Return: 0 if OK; 1 on error
  *
  *  Note: if naloc is given, there is no requirement that the
  *        data points are evenly spaced.  Lagrangian interpolation
  *        handles that.  The only requirement is that the
  *        data points are ordered so that the values in naloc
  *        are either increasing or decreasing.  We test to make
  *        sure that the sizes of na and naloc are equal, and it
  *        is assumed that the correspondences na[i] as a function
  *        of naloc[i] are properly arranged for all i.
  *
  *  The formula for Lagrangian interpolation through 3 data pts is:
  *       y(x) = y1(x-x2)(x-x3)/((x1-x2)(x1-x3)) +
  *              y2(x-x1)(x-x3)/((x2-x1)(x2-x3)) +
  *              y3(x-x1)(x-x2)/((x3-x1)(x3-x2))
  *
  *  Then the derivative, using the constants (c1,c2,c3) defined below,
  *  is set to 0:
  *       y'(x) = 2x(c1+c2+c3) - c1(x2+x3) - c2(x1+x3) - c3(x1+x2) = 0
  */
 l_int32
 numaFitMax(NUMA       *na,
            l_float32  *pmaxval,
            NUMA       *naloc,
            l_float32  *pmaxloc)
 {
 l_float32  val;
 l_float32  smaxval;  /* start value of maximum sample, before interpolating */
 l_int32    n, imaxloc;
 l_float32  x1, x2, x3, y1, y2, y3, c1, c2, c3, a, b, xmax, ymax;

     PROCNAME("numaFitMax");

     *pmaxval = *pmaxloc = 0.0;  /* init */

     if (!na)
         return ERROR_INT("na not defined", procName, 1);
     if (!pmaxval)
         return ERROR_INT("&maxval not defined", procName, 1);
     if (!pmaxloc)
         return ERROR_INT("&maxloc not defined", procName, 1);

     n = numaGetCount(na);
     if (naloc) {
         if (n != numaGetCount(naloc))
             return ERROR_INT("na and naloc of unequal size", procName, 1);
     }

     numaGetMax(na, &smaxval, &imaxloc);

         /* Simple case: max is at end point */
     if (imaxloc == 0 || imaxloc == n - 1) {
         *pmaxval = smaxval;
         if (naloc) {
             numaGetFValue(naloc, imaxloc, &val);
             *pmaxloc = val;
         }
         else
             *pmaxloc = imaxloc;
         return 0;
     }

         /* Interior point; use quadratic interpolation */
     y2 = smaxval;
     numaGetFValue(na, imaxloc - 1, &val);
     y1 = val;
     numaGetFValue(na, imaxloc + 1, &val);
     y3 = val;
     if (naloc) {
         numaGetFValue(naloc, imaxloc - 1, &val);
         x1 = val;
         numaGetFValue(naloc, imaxloc, &val);
         x2 = val;
         numaGetFValue(naloc, imaxloc + 1, &val);
         x3 = val;
     }
     else {
         x1 = imaxloc - 1;
         x2 = imaxloc;
         x3 = imaxloc + 1;
     }

         /* Can't interpolate; just use the max val in na
          * and the corresponding one in naloc */
     if (x1 == x2 || x1 == x3 || x2 == x3) {
         *pmaxval = y2;
         *pmaxloc = x2;
         return 0;
     }

         /* Use lagrangian interpolation; set dy/dx = 0 */
     c1 = y1 / ((x1 - x2) * (x1 - x3));
     c2 = y2 / ((x2 - x1) * (x2 - x3));
     c3 = y3 / ((x3 - x1) * (x3 - x2));
     a = c1 + c2 + c3;
     b = c1 * (x2 + x3) + c2 * (x1 + x3) + c3 * (x1 + x2);
     xmax = b / (2 * a);
     ymax = c1 * (xmax - x2) * (xmax - x3) +
            c2 * (xmax - x1) * (xmax - x3) +
            c3 * (xmax - x1) * (xmax - x2);
     *pmaxval = ymax;
     *pmaxloc = xmax;

     return 0;
 }


 /*!
  *  numaDifferentiateInterval()
  *
  *      Input:  nax (numa of abscissa values)
  *              nay (numa of ordinate values, corresponding to nax)
  *              x0 (start value of interval)
  *              x1 (end value of interval)
  *              npts (number of points to evaluate function in interval)
  *              &nadx (<optional return> array of x values in interval)
  *              &nady (<return> array of derivatives in interval)
  *      Return: 0 if OK, 1 on error (e.g., if x0 or x1 is outside range)
  *
  *  Notes:
  *      (1) The values in nax must be sorted in increasing order.
  *          If they are not sorted, it is done in the interpolation
  *          step, and a warning is issued.
  *      (2) Caller should check for valid return.
  */
 l_int32
 numaDifferentiateInterval(NUMA       *nax,
                           NUMA       *nay,
                           l_float32   x0,
                           l_float32   x1,
                           l_int32     npts,
                           NUMA      **pnadx,
                           NUMA      **pnady)
 {
 l_int32     i, nx, ny;
 l_float32   minx, maxx, der, invdel;
 l_float32  *fay;
 NUMA       *nady, *naiy;

     PROCNAME("numaDifferentiateInterval");

     if (pnadx) *pnadx = NULL;
     if (!pnady)
         return ERROR_INT("&nady not defined", procName, 1);
     *pnady = NULL;
     if (!nay)
         return ERROR_INT("nay not defined", procName, 1);
     if (!nax)
         return ERROR_INT("nax not defined", procName, 1);
     if (x0 > x1)
         return ERROR_INT("x0 > x1", procName, 1);
     ny = numaGetCount(nay);
     nx = numaGetCount(nax);
     if (nx != ny)
         return ERROR_INT("nax and nay not same size arrays", procName, 1);
     if (ny < 2)
         return ERROR_INT("not enough points", procName, 1);
     numaGetMin(nax, &minx, NULL);
     numaGetMax(nax, &maxx, NULL);
     if (x0 < minx || x1 > maxx)
         return ERROR_INT("xval is out of bounds", procName, 1);
     if (npts < 2)
         return ERROR_INT("npts < 2", procName, 1);

         /* Generate interpolated array over specified interval */
     if (numaInterpolateArbxInterval(nax, nay, L_LINEAR_INTERP, x0, x1,
                                     npts, pnadx, &naiy))
         return ERROR_INT("interpolation failed", procName, 1);

     nady = numaCreate(npts);
     *pnady = nady;
     invdel = 0.5 * ((l_float32)npts - 1.0) / (x1 - x0);
     fay = numaGetFArray(naiy, L_NOCOPY);

         /* Compute and save derivatives */
     der = 0.5 * invdel * (fay[1] - fay[0]);
     numaAddNumber(nady, der);
     for (i = 1; i < npts - 1; i++)  {
         der = invdel * (fay[i + 1] - fay[i - 1]);
         numaAddNumber(nady, der);
     }
     der = 0.5 * invdel * (fay[npts - 1] - fay[npts - 2]);
     numaAddNumber(nady, der);

     numaDestroy(&naiy);
     return 0;
 }


 /*!
  *  numaIntegrateInterval()
  *
  *      Input:  nax (numa of abscissa values)
  *              nay (numa of ordinate values, corresponding to nax)
  *              x0 (start value of interval)
  *              x1 (end value of interval)
  *              npts (number of points to evaluate function in interval)
  *              &sum (<return> integral of function over interval)
  *      Return: 0 if OK, 1 on error (e.g., if x0 or x1 is outside range)
  *
  *  Notes:
  *      (1) The values in nax must be sorted in increasing order.
  *          If they are not sorted, it is done in the interpolation
  *          step, and a warning is issued.
  *      (2) Caller should check for valid return.
  */
 l_int32
 numaIntegrateInterval(NUMA       *nax,
                       NUMA       *nay,
                       l_float32   x0,
                       l_float32   x1,
                       l_int32     npts,
                       l_float32  *psum)
 {
 l_int32     i, nx, ny;
 l_float32   minx, maxx, sum, del;
 l_float32  *fay;
 NUMA       *naiy;

     PROCNAME("numaIntegrateInterval");

     if (!psum)
         return ERROR_INT("&sum not defined", procName, 1);
     *psum = 0.0;
     if (!nay)
         return ERROR_INT("nay not defined", procName, 1);
     if (!nax)
         return ERROR_INT("nax not defined", procName, 1);
     if (x0 > x1)
         return ERROR_INT("x0 > x1", procName, 1);
     if (npts < 2)
         return ERROR_INT("npts < 2", procName, 1);
     ny = numaGetCount(nay);
     nx = numaGetCount(nax);
     if (nx != ny)
         return ERROR_INT("nax and nay not same size arrays", procName, 1);
     if (ny < 2)
         return ERROR_INT("not enough points", procName, 1);
     numaGetMin(nax, &minx, NULL);
     numaGetMax(nax, &maxx, NULL);
     if (x0 < minx || x1 > maxx)
         return ERROR_INT("xval is out of bounds", procName, 1);

         /* Generate interpolated array over specified interval */
     if (numaInterpolateArbxInterval(nax, nay, L_LINEAR_INTERP, x0, x1,
                                     npts, NULL, &naiy))
         return ERROR_INT("interpolation failed", procName, 1);

     del = (x1 - x0) / ((l_float32)npts - 1.0);
     fay = numaGetFArray(naiy, L_NOCOPY);

         /* Compute integral (simple trapezoid) */
     sum = 0.5 * (fay[0] + fay[npts - 1]);
     for (i = 1; i < npts - 1; i++)
         sum += fay[i];
     *psum = del * sum;

     numaDestroy(&naiy);
     return 0;
 }


 /*----------------------------------------------------------------------*
  *                                Sorting                               *
  *----------------------------------------------------------------------*/
 /*!
  *  numaSort()
  *
  *      Input:  naout (output numa; can be NULL or equal to nain)
  *              nain (input numa)
  *              sortorder (L_SORT_INCREASING or L_SORT_DECREASING)
  *      Return: naout (output sorted numa), or null on error
  *
  *  Notes:
  *      (1) Set naout = nain for in-place; otherwise, set naout = NULL.
  *      (2) Source: Shell sort, modified from K&R, 2nd edition, p.62.
  *          Slow but simple O(n logn) sort.
  */
 NUMA *
 numaSort(NUMA    *naout,
          NUMA    *nain,
          l_int32  sortorder)
 {
 l_int32     i, n, gap, j;
 l_float32   tmp;
 l_float32  *array;

     PROCNAME("numaSort");

     if (!nain)
         return (NUMA *)ERROR_PTR("nain not defined", procName, NULL);

         /* Make naout if necessary; otherwise do in-place */
     if (!naout)
         naout = numaCopy(nain);
     else if (nain != naout)
         return (NUMA *)ERROR_PTR("invalid: not in-place", procName, NULL);
     array = naout->array;  /* operate directly on the array */
     n = numaGetCount(naout);

         /* Shell sort */
     for (gap = n/2; gap > 0; gap = gap / 2) {
         for (i = gap; i < n; i++) {
             for (j = i - gap; j >= 0; j -= gap) {
                 if ((sortorder == L_SORT_INCREASING &&
                      array[j] > array[j + gap]) ||
                     (sortorder == L_SORT_DECREASING &&
                      array[j] < array[j + gap]))
                 {
                     tmp = array[j];
                     array[j] = array[j + gap];
                     array[j + gap] = tmp;
                 }
             }
         }
     }

     return naout;
 }


 /*!
  *  numaGetSortIndex()
  *
  *      Input:  na
  *              sortorder (L_SORT_INCREASING or L_SORT_DECREASING)
  *      Return: na giving an array of indices that would sort
  *              the input array, or null on error
  */
 NUMA *
 numaGetSortIndex(NUMA    *na,
                  l_int32  sortorder)
 {
 l_int32     i, n, gap, j;
 l_float32   tmp;
 l_float32  *array;   /* copy of input array */
 l_float32  *iarray;  /* array of indices */
 NUMA       *naisort;

     PROCNAME("numaGetSortIndex");

     if (!na)
         return (NUMA *)ERROR_PTR("na not defined", procName, NULL);
     if (sortorder != L_SORT_INCREASING && sortorder != L_SORT_DECREASING)
         return (NUMA *)ERROR_PTR("invalid sortorder", procName, NULL);

     n = numaGetCount(na);
     if ((array = numaGetFArray(na, L_COPY)) == NULL)
         return (NUMA *)ERROR_PTR("array not made", procName, NULL);
     if ((iarray = (l_float32 *)CALLOC(n, sizeof(l_float32))) == NULL)
         return (NUMA *)ERROR_PTR("iarray not made", procName, NULL);
     for (i = 0; i < n; i++)
         iarray[i] = i;

         /* Shell sort */
     for (gap = n/2; gap > 0; gap = gap / 2) {
         for (i = gap; i < n; i++) {
             for (j = i - gap; j >= 0; j -= gap) {
                 if ((sortorder == L_SORT_INCREASING &&
                      array[j] > array[j + gap]) ||
                     (sortorder == L_SORT_DECREASING &&
                      array[j] < array[j + gap]))
                 {
                     tmp = array[j];
                     array[j] = array[j + gap];
                     array[j + gap] = tmp;
                     tmp = iarray[j];
                     iarray[j] = iarray[j + gap];
                     iarray[j + gap] = tmp;
                 }
             }
         }
     }

     naisort = numaCreate(n);
     for (i = 0; i < n; i++)
         numaAddNumber(naisort, iarray[i]);

     FREE(array);
     FREE(iarray);
     return naisort;
 }


 /*!
  *  numaSortByIndex()
  *
  *      Input:  nas
  *              naindex (na that maps from the new numa to the input numa)
  *      Return: nad (sorted), or null on error
  */
 NUMA *
 numaSortByIndex(NUMA  *nas,
                 NUMA  *naindex)
 {
 l_int32    i, n, index;
 l_float32  val;
 NUMA      *nad;

     PROCNAME("numaSortByIndex");

     if (!nas)
         return (NUMA *)ERROR_PTR("nas not defined", procName, NULL);
     if (!naindex)
         return (NUMA *)ERROR_PTR("naindex not defined", procName, NULL);

     n = numaGetCount(nas);
     nad = numaCreate(n);
     for (i = 0; i < n; i++) {
         numaGetIValue(naindex, i, &index);
         numaGetFValue(nas, index, &val);
         numaAddNumber(nad, val);
     }

     return nad;
 }


 /*!
  *  numaIsSorted()
  *
  *      Input:  nas
  *              sortorder (L_SORT_INCREASING or L_SORT_DECREASING)
  *              &sorted (<return> 1 if sorted; 0 if not)
  *      Return: 1 if OK; 0 on error
  *
  *  Notes:
  *      (1) This is a quick O(n) test if nas is sorted.  It is useful
  *          in situations where the array is likely to be already
  *          sorted, and a sort operation can be avoided.
  */
 l_int32
 numaIsSorted(NUMA     *nas,
              l_int32   sortorder,
 	     l_int32  *psorted)
 {
 l_int32    i, n;
 l_float32  preval, val;

     PROCNAME("numaIsSorted");

     if (!psorted)
         return ERROR_INT("&sorted not defined", procName, 1);
     *psorted = FALSE;
     if (!nas)
         return ERROR_INT("nas not defined", procName, 1);
     if (sortorder != L_SORT_INCREASING && sortorder != L_SORT_DECREASING)
         return ERROR_INT("invalid sortorder", procName, 1);

     n = numaGetCount(nas);
     numaGetFValue(nas, 0, &preval);
     for (i = 1; i < n; i++) {
         numaGetFValue(nas, i, &val);
         if ((sortorder == L_SORT_INCREASING && val < preval) ||
             (sortorder == L_SORT_DECREASING && val > preval))
             return 0;
     }

     *psorted = TRUE;
     return 0;
 }


 /*!
  *  numaSortPair()
  *
  *      Input:  nax, nay (input arrays)
  *              sortorder (L_SORT_INCREASING or L_SORT_DECREASING)
  *              &nasx (<return> sorted)
  *              &naxy (<return> sorted exactly in order of nasx)
  *      Return: 0 if OK, 1 on error
  *
  *  Notes:
  *      (1) This function sorts the two input arrays, nax and nay,
  *          together, using nax as the key for sorting.
  */
 l_int32
 numaSortPair(NUMA    *nax,
              NUMA    *nay,
              l_int32  sortorder,
              NUMA   **pnasx,
              NUMA   **pnasy)
 {
 l_int32  sorted;
 NUMA    *naindex;

     PROCNAME("numaSortPair");

     if (!pnasx)
         return ERROR_INT("&nasx not defined", procName, 1);
     if (!pnasy)
         return ERROR_INT("&nasy not defined", procName, 1);
     *pnasx = *pnasy = NULL;
     if (!nax)
         return ERROR_INT("nax not defined", procName, 1);
     if (!nay)
         return ERROR_INT("nay not defined", procName, 1);
     if (sortorder != L_SORT_INCREASING && sortorder != L_SORT_DECREASING)
         return ERROR_INT("invalid sortorder", procName, 1);

     numaIsSorted(nax, sortorder, &sorted);
     if (sorted == TRUE) {
         *pnasx = numaCopy(nax);
         *pnasy = numaCopy(nay);
     }
     else {
         naindex = numaGetSortIndex(nax, sortorder);
 	*pnasx = numaSortByIndex(nax, naindex);
 	*pnasy = numaSortByIndex(nay, naindex);
 	numaDestroy(&naindex);
     }

     return 0;
 }


 /*!
  *  numaPseudorandomSequence()
  *
  *      Input:  size (of sequence)
  *              seed (prime number; use 0 for default)
  *      Return: na (pseudorandom on {0,...,size - 1}), or null on error
  *
  *  Notes:
  *      (1) Result is a permutation of the sequence of integers
  *          from 0 to size - 1, where (seed % size) is repeatedly
  *          added to the previous result, and the result is taken mod size.
  *          This is not particularly random!
  */
 NUMA *
 numaPseudorandomSequence(l_int32  size,
                          l_int32  seed)
 {
 l_int32  i, val;
 NUMA    *na;

     PROCNAME("numaPseudorandomSequence");

     if (size <= 0)
         return (NUMA *)ERROR_PTR("size <= 0", procName, NULL);
     if (seed == 0)
         seed = 165653;

     if ((na = numaCreate(size)) == NULL)
         return (NUMA *)ERROR_PTR("na not made", procName, NULL);
     val = seed / 7;
     for (i = 0; i < size; i++) {
         val = (val + seed) % size;
         numaAddNumber(na, val);
     }

     return na;
 }


 /*----------------------------------------------------------------------*
  *                     Functions requiring sorting                      *
  *----------------------------------------------------------------------*/
 /*!
  *  numaGetMedian()
  *
  *      Input:  na
  *              &val  (<return> median val)
  *      Return: 0 if OK; 1 on error
  *
  *  Notes:
  *      (1) Computes the median value of the numbers in the numa, by
  *          sorting and finding the middle value in the sorted array.
  */
 l_int32
 numaGetMedian(NUMA       *na,
               l_float32  *pval)
 {
 l_int32  n;
 NUMA    *nasort;

     PROCNAME("numaGetMedian");

     if (!na)
         return ERROR_INT("na not defined", procName, 1);
     if (!pval)
         return ERROR_INT("&val not defined", procName, 1);
     *pval = 0.0;  /* init */

     n = numaGetCount(na);
     if (n == 0)
         return 1;
     if ((nasort = numaSort(NULL, na, L_SORT_DECREASING)) == NULL)
         return ERROR_INT("nasort not made", procName, 1);
     numaGetFValue(nasort, n / 2, pval);

     numaDestroy(&nasort);
     return 0;
 }


 /*!
  *  numaGetMode()
  *
  *      Input:  na
  *              &val  (<return> mode val)
  *              &count  (<optional return> mode count)
  *      Return: 0 if OK; 1 on error
  *
  *  Notes:
  *      (1) Computes the mode value of the numbers in the numa, by
  *          sorting and finding the value of the number with the
  *          largest count.
  *      (2) Optionally, also returns that count.
  */
 l_int32
 numaGetMode(NUMA       *na,
             l_float32  *pval,
             l_int32    *pcount)
 {
 l_int32     i, n, maxcount, prevcount;
 l_float32   val, maxval, prevval;
 l_float32  *array;
 NUMA       *nasort;

     PROCNAME("numaGetMode");

     if (!na)
         return ERROR_INT("na not defined", procName, 1);
     if (!pval)
         return ERROR_INT("&val not defined", procName, 1);

     *pval = 0.0;
     if (pcount) *pcount = 0;
     if ((n = numaGetCount(na)) == 0)
         return 1;

     if ((nasort = numaSort(NULL, na, L_SORT_DECREASING)) == NULL)
         return ERROR_INT("nas not made", procName, 1);
     array = numaGetFArray(nasort, L_NOCOPY);

         /* Initialize with array[0] */
     prevval = array[0];
     prevcount = 1;
     maxval = prevval;
     maxcount = prevcount;

         /* Scan the sorted array, aggregating duplicates */
     for (i = 1; i < n; i++) {
         val = array[i];
         if (val == prevval)
             prevcount++;
         else {  /* new value */
             if (prevcount > maxcount) {  /* new max */
                 maxcount = prevcount;
                 maxval = prevval;
             }
             prevval = val;
             prevcount = 1;
         }
     }

         /* Was the mode the last run of elements? */
     if (prevcount > maxcount) {
         maxcount = prevcount;
         maxval = prevval;
     }

     *pval = maxval;
     if (pcount)
         *pcount = maxcount;

     numaDestroy(&nasort);
     return 0;
 }


 /*----------------------------------------------------------------------*
  *                          Numa combination                            *
  *----------------------------------------------------------------------*/
 /*!
  *  numaJoin()
  *
  *      Input:  nad  (dest numa; add to this one)
  *              nas  (<optional> source numa; add from this one)
  *              istart  (starting index in nas)
  *              iend  (ending index in nas; use 0 to cat all)
  *      Return: 0 if OK, 1 on error
  *
  *  Notes:
  *      (1) istart < 0 is taken to mean 'read from the start' (istart = 0)
  *      (2) iend <= 0 means 'read to the end'
  *      (3) if nas == NULL, this is a no-op
  */
 l_int32
 numaJoin(NUMA    *nad,
          NUMA    *nas,
          l_int32  istart,
          l_int32  iend)
 {
 l_int32    ns, i;
 l_float32  val;

     PROCNAME("numaJoin");

     if (!nad)
         return ERROR_INT("nad not defined", procName, 1);
     if (!nas)
         return 0;
     ns = numaGetCount(nas);
     if (istart < 0)
         istart = 0;
     if (istart >= ns)
         return ERROR_INT("istart out of bounds", procName, 1);
     if (iend <= 0)
         iend = ns - 1;
     if (iend >= ns)
         return ERROR_INT("iend out of bounds", procName, 1);
     if (istart > iend)
         return ERROR_INT("istart > iend; nothing to add", procName, 1);

     for (i = istart; i <= iend; i++) {
         numaGetFValue(nas, i, &val);
         numaAddNumber(nad, val);
     }

     return 0;
 }


 /*!
  *  numaaFlattenToNuma()
  *
  *      Input:  numaa
  *      Return: numa, or null on error
  *
  *  Notes:
  *      (1) This 'flattens' the Numaa to a Numa, by joining successively
  *          each Numa in the Numaa.
  *      (2) It doesn't make any assumptions about the location of the
  *          Numas in the Numaa array, unlike most Numaa functions.
  *      (3) It leaves the input Numaa unchanged.
  */
 NUMA *
 numaaFlattenToNuma(NUMAA  *naa)
 {
 l_int32  i, nalloc;
 NUMA    *na, *nad;
 NUMA   **array;

     PROCNAME("numaaFlattenToNuma");

     if (!naa)
         return (NUMA *)ERROR_PTR("naa not defined", procName, NULL);

     nalloc = naa->nalloc;
     array = numaaGetPtrArray(naa);
     nad = numaCreate(0);
     for (i = 0; i < nalloc; i++) {
         na = array[i];
         if (!na) continue;
         numaJoin(nad, na, 0, 0);
     }

     return nad;
 }