liblept/grayquant.c - platform/external/tesseract - Git at Google

 /*====================================================================*
  -  Copyright (C) 2001 Leptonica.  All rights reserved.
  -  This software is distributed in the hope that it will be
  -  useful, but with NO WARRANTY OF ANY KIND.
  -  No author or distributor accepts responsibility to anyone for the
  -  consequences of using this software, or for whether it serves any
  -  particular purpose or works at all, unless he or she says so in
  -  writing.  Everyone is granted permission to copy, modify and
  -  redistribute this source code, for commercial or non-commercial
  -  purposes, with the following restrictions: (1) the origin of this
  -  source code must not be misrepresented; (2) modified versions must
  -  be plainly marked as such; and (3) this notice may not be removed
  -  or altered from any source or modified source distribution.
  *====================================================================*/

 /*
  *  grayquant.c
  *
  *      Thresholding from 8 bpp to 1 bpp
  *
  *          Floyd-Steinberg dithering to binary
  *              PIX    *pixDitherToBinary()
  *              PIX    *pixDitherToBinarySpec()
  *
  *          Simple (pixelwise) binarization with fixed threshold
  *              PIX    *pixThresholdToBinary()
  *
  *          Binarization with variable threshold
  *              PIX    *pixVarThresholdToBinary()
  *
  *          Slower implementation of Floyd-Steinberg dithering, using LUTs
  *              PIX    *pixDitherToBinaryLUT()
  *
  *          Generate a binary mask from pixels of particular values
  *              PIX    *pixGenerateMaskByValue()
  *              PIX    *pixGenerateMaskByBand()
  *
  *      Thresholding from 8 bpp to 2 bpp
  *
  *          Dithering to 2 bpp
  *              PIX      *pixDitherTo2bpp()
  *              PIX      *pixDitherTo2bppSpec()
  *
  *          Simple (pixelwise) thresholding to 2 bpp with optional cmap
  *              PIX      *pixThresholdTo2bpp()
  *
  *      Simple (pixelwise) thresholding from 8 bpp to 4 bpp
  *              PIX      *pixThresholdTo4bpp()
  *
  *      Simple (pixelwise) quantization on 8 bpp grayscale
  *              PIX      *pixThresholdOn8bpp()
  *
  *      Arbitrary (pixelwise) thresholding from 8 bpp to 2, 4 or 8 bpp
  *              PIX      *pixThresholdGrayArb()
  *
  *      Quantization tables for linear thresholds of grayscale images
  *              l_int32  *makeGrayQuantIndexTable()
  *              l_int32  *makeGrayQuantTargetTable()
  *
  *      Quantization table for arbitrary thresholding of grayscale images
  *              l_int32   makeGrayQuantTableArb()
  *              l_int32   makeGrayQuantColormapArb()
  *
  *      Thresholding from 32 bpp rgb to 1 bpp
  *      (really color quantization, but it's better placed in this file)
  *              PIX      *pixGenerateMaskByBand32()
  *              PIX      *pixGenerateMaskByDiscr32()
  *
  *      Histogram-based grayscale quantization
  *              PIX      *pixGrayQuantFromHisto()
  *       static l_int32   numaFillCmapFromHisto()
  *
  *      Color quantize grayscale image using existing colormap
  *              PIX      *pixGrayQuantFromCmap()
  */

 #include <stdio.h>
 #include <stdlib.h>
 #include <string.h>
 #include <math.h>
 #include "allheaders.h"


 static l_int32 numaFillCmapFromHisto(NUMA *na, PIXCMAP *cmap,
                                      l_float32 minfract, l_int32 maxsize,
                                      l_int32 **plut);


 /*------------------------------------------------------------------*
  *             Binarization by Floyd-Steinberg dithering            *
  *------------------------------------------------------------------*/
 /*!
  *  pixDitherToBinary()
  *
  *      Input:  pixs
  *      Return: pixd (dithered binary), or null on error
  *
  *  The Floyd-Steinberg error diffusion dithering algorithm
  *  binarizes an 8 bpp grayscale image to a threshold of 128.
  *  If a pixel has a value above 127, it is binarized to white
  *  and the excess (below 255) is subtracted from three
  *  neighboring pixels in the fractions 3/8 to (i, j+1),
  *  3/8 to (i+1, j) and 1/4 to (i+1,j+1), truncating to 0
  *  if necessary.  Likewise, if it the pixel has a value
  *  below 128, it is binarized to black and the excess above 0
  *  is added to the neighboring pixels, truncating to 255 if necessary.
  *
  *  This function differs from straight dithering in that it allows
  *  clipping of grayscale to 0 or 255 if the values are
  *  sufficiently close, without distribution of the excess.
  *  This uses default values to specify the range of lower
  *  and upper values (near 0 and 255, rsp) that are clipped
  *  to black and white without propagating the excess.
  *  Not propagating the excess has the effect of reducing the
  *  snake patterns in parts of the image that are nearly black or white;
  *  however, it also prevents the attempt to reproduce gray for those values.
  *
  *  The implementation is straightforward.  It uses a pair of
  *  line buffers to avoid changing pixs.  It is about 2x faster
  *  than the implementation using LUTs.
  */
 PIX *
 pixDitherToBinary(PIX  *pixs)
 {
     PROCNAME("pixDitherToBinary");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     if (pixGetDepth(pixs) != 8)
         return (PIX *)ERROR_PTR("must be 8 bpp for dithering", procName, NULL);

     return pixDitherToBinarySpec(pixs, DEFAULT_CLIP_LOWER_1,
                                  DEFAULT_CLIP_UPPER_1);
 }


 /*!
  *  pixDitherToBinarySpec()
  *
  *      Input:  pixs
  *              lowerclip (lower clip distance to black; use 0 for default)
  *              upperclip (upper clip distance to white; use 0 for default)
  *      Return: pixd (dithered binary), or null on error
  *
  *  Notes:
  *      (1) See comments above in pixDitherToBinary() for details.
  *      (2) The input parameters lowerclip and upperclip specify the range
  *          of lower and upper values (near 0 and 255, rsp) that are
  *          clipped to black and white without propagating the excess.
  *          For that reason, lowerclip and upperclip should be small numbers.
  */
 PIX *
 pixDitherToBinarySpec(PIX     *pixs,
                       l_int32  lowerclip,
                       l_int32  upperclip)
 {
 l_int32    w, h, d, wplt, wpld;
 l_uint32  *datat, *datad;
 l_uint32  *bufs1, *bufs2;
 PIX       *pixt, *pixd;

     PROCNAME("pixDitherToBinarySpec");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     pixGetDimensions(pixs, &w, &h, &d);
     if (d != 8)
         return (PIX *)ERROR_PTR("must be 8 bpp for dithering", procName, NULL);
     if (lowerclip < 0 || lowerclip > 255)
         return (PIX *)ERROR_PTR("invalid value for lowerclip", procName, NULL);
     if (upperclip < 0 || upperclip > 255)
         return (PIX *)ERROR_PTR("invalid value for upperclip", procName, NULL);

     if ((pixd = pixCreate(w, h, 1)) == NULL)
         return (PIX *)ERROR_PTR("pixd not made", procName, NULL);
     pixCopyResolution(pixd, pixs);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);

         /* Remove colormap if it exists */
     pixt = pixRemoveColormap(pixs, REMOVE_CMAP_TO_GRAYSCALE);
     datat = pixGetData(pixt);
     wplt = pixGetWpl(pixt);

         /* Two line buffers, 1 for current line and 2 for next line */
     if ((bufs1 = (l_uint32 *)CALLOC(wplt, sizeof(l_uint32))) == NULL)
         return (PIX *)ERROR_PTR("bufs1 not made", procName, NULL);
     if ((bufs2 = (l_uint32 *)CALLOC(wplt, sizeof(l_uint32))) == NULL)
         return (PIX *)ERROR_PTR("bufs2 not made", procName, NULL);

     ditherToBinaryLow(datad, w, h, wpld, datat, wplt, bufs1, bufs2,
                       lowerclip, upperclip);

     FREE(bufs1);
     FREE(bufs2);
     pixDestroy(&pixt);

     return pixd;
 }


 /*------------------------------------------------------------------*
  *       Simple (pixelwise) binarization with fixed threshold       *
  *------------------------------------------------------------------*/
 /*!
  *  pixThresholdToBinary()
  *
  *      Input:  pixs (4 or 8 bpp)
  *              threshold value
  *      Return: pixd (1 bpp), or null on error
  *
  *  Notes:
  *      (1) If the source pixel is less than the threshold value,
  *          the dest will be 1; otherwise, it will be 0
  */
 PIX *
 pixThresholdToBinary(PIX     *pixs,
                      l_int32  thresh)
 {
 l_int32    d, w, h, wplt, wpld;
 l_uint32  *datat, *datad;
 PIX       *pixt, *pixd;

     PROCNAME("pixThresholdToBinary");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     pixGetDimensions(pixs, &w, &h, &d);
     if (d != 4 && d != 8)
         return (PIX *)ERROR_PTR("pixs must be 4 or 8 bpp", procName, NULL);
     if (thresh < 0)
         return (PIX *)ERROR_PTR("thresh must be non-negative", procName, NULL);
     if (d == 4 && thresh > 16)
         return (PIX *)ERROR_PTR("4 bpp thresh not in {0-16}", procName, NULL);
     if (d == 8 && thresh > 256)
         return (PIX *)ERROR_PTR("8 bpp thresh not in {0-256}", procName, NULL);

     if ((pixd = pixCreate(w, h, 1)) == NULL)
         return (PIX *)ERROR_PTR("pixd not made", procName, NULL);
     pixCopyResolution(pixd, pixs);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);

         /* Remove colormap if it exists.  If there is a colormap,
          * pixt will be 8 bpp regardless of the depth of pixs. */
     pixt = pixRemoveColormap(pixs, REMOVE_CMAP_TO_GRAYSCALE);
     datat = pixGetData(pixt);
     wplt = pixGetWpl(pixt);
     if (pixGetColormap(pixs) && d == 4) {  /* promoted to 8 bpp */
         d = 8;
         thresh *= 16;
     }

     thresholdToBinaryLow(datad, w, h, wpld, datat, d, wplt, thresh);
     pixDestroy(&pixt);
     return pixd;
 }


 /*------------------------------------------------------------------*
  *                Binarization with variable threshold              *
  *------------------------------------------------------------------*/
 /*!
  *  pixVarThresholdToBinary()
  *
  *      Input:  pixs (8 bpp)
  *              pixg (8 bpp; contains threshold values for each pixel)
  *      Return: pixd (1 bpp), or null on error
  *
  *  Notes:
  *      (1) If the pixel in pixs is less than the corresponding pixel
  *          in pixg, the dest will be 1; otherwise it will be 0.
  */
 PIX *
 pixVarThresholdToBinary(PIX  *pixs,
                         PIX  *pixg)
 {
 l_int32    i, j, vals, valg, w, h, d, wpls, wplg, wpld;
 l_uint32  *datas, *datag, *datad, *lines, *lineg, *lined;
 PIX       *pixd;

     PROCNAME("pixVarThresholdToBinary");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     if (!pixg)
         return (PIX *)ERROR_PTR("pixg not defined", procName, NULL);
     if (!pixSizesEqual(pixs, pixg))
         return (PIX *)ERROR_PTR("pix sizes not equal", procName, NULL);
     pixGetDimensions(pixs, &w, &h, &d);
     if (d != 8)
         return (PIX *)ERROR_PTR("pixs must be 8 bpp", procName, NULL);

     pixd = pixCreate(w, h, 1);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);
     datas = pixGetData(pixs);
     wpls = pixGetWpl(pixs);
     datag = pixGetData(pixg);
     wplg = pixGetWpl(pixg);
     for (i = 0; i < h; i++) {
         lines = datas + i * wpls;
         lineg = datag + i * wplg;
         lined = datad + i * wpld;
         for (j = 0; j < w; j++) {
             vals = GET_DATA_BYTE(lines, j);
             valg = GET_DATA_BYTE(lineg, j);
             if (vals < valg)
                 SET_DATA_BIT(lined, j);
         }
     }

     return pixd;
 }


 /*--------------------------------------------------------------------*
  *    Slower implementation of binarization by dithering using LUTs   *
  *--------------------------------------------------------------------*/
 /*!
  *  pixDitherToBinaryLUT()
  *
  *      Input:  pixs
  *              lowerclip (lower clip distance to black; use -1 for default)
  *              upperclip (upper clip distance to white; use -1 for default)
  *      Return: pixd (dithered binary), or null on error
  *
  *  This implementation is deprecated.  You should use pixDitherToBinary().
  *
  *  See comments in pixDitherToBinary()
  *
  *  This implementation additionally uses three lookup tables to
  *  generate the output pixel value and the excess or deficit
  *  carried over to the neighboring pixels.
  */
 PIX *
 pixDitherToBinaryLUT(PIX     *pixs,
                      l_int32  lowerclip,
                      l_int32  upperclip)
 {
 l_int32    w, h, d, wplt, wpld;
 l_int32   *tabval, *tab38, *tab14;
 l_uint32  *datat, *datad;
 l_uint32  *bufs1, *bufs2;
 PIX       *pixt, *pixd;

     PROCNAME("pixDitherToBinaryLUT");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     pixGetDimensions(pixs, &w, &h, &d);
     if (d != 8)
         return (PIX *)ERROR_PTR("must be 8 bpp for dithering", procName, NULL);
     if (lowerclip < 0)
         lowerclip = DEFAULT_CLIP_LOWER_1;
     if (upperclip < 0)
         upperclip = DEFAULT_CLIP_UPPER_1;

     if ((pixd = pixCreate(w, h, 1)) == NULL)
         return (PIX *)ERROR_PTR("pixd not made", procName, NULL);
     pixCopyResolution(pixd, pixs);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);

         /* Remove colormap if it exists */
     pixt = pixRemoveColormap(pixs, REMOVE_CMAP_TO_GRAYSCALE);
     datat = pixGetData(pixt);
     wplt = pixGetWpl(pixt);

         /* Two line buffers, 1 for current line and 2 for next line */
     if ((bufs1 = (l_uint32 *)CALLOC(wplt, sizeof(l_uint32))) == NULL)
         return (PIX *)ERROR_PTR("bufs1 not made", procName, NULL);
     if ((bufs2 = (l_uint32 *)CALLOC(wplt, sizeof(l_uint32))) == NULL)
         return (PIX *)ERROR_PTR("bufs2 not made", procName, NULL);

         /* 3 lookup tables: 1-bit value, (3/8)excess, and (1/4)excess */
     make8To1DitherTables(&tabval, &tab38, &tab14, lowerclip, upperclip);

     ditherToBinaryLUTLow(datad, w, h, wpld, datat, wplt, bufs1, bufs2,
                          tabval, tab38, tab14);

     FREE(bufs1);
     FREE(bufs2);
     FREE(tabval);
     FREE(tab38);
     FREE(tab14);
     pixDestroy(&pixt);

     return pixd;
 }


 /*--------------------------------------------------------------------*
  *       Generate a binary mask from pixels of particular value(s)    *
  *--------------------------------------------------------------------*/
 /*!
  *  pixGenerateMaskByValue()
  *
  *      Input:  pixs (8 bpp, or colormapped)
  *              val (of pixels for which we set 1 in dest)
  *      Return: pixd (1 bpp), or null on error
  *
  *  Notes:
  *      (1) @val is the gray value of the pixels that we are selecting.
  *      (2) If pixs is colormapped, this first removes the colormap to
  *          generate an approximate grayscale value for each pixel, and
  *          then looks for gray pixels with the value @val.
  *      (3) If pixs is colormapped and you want to use @val to select
  *          the colormap index, you must first call pixDestroyColormap(pixs)
  *          to remove the colormap from pixs.
  */
 PIX *
 pixGenerateMaskByValue(PIX     *pixs,
                        l_int32  val)
 {
 l_int32    i, j, w, h, wplg, wpld;
 l_uint32  *datag, *datad, *lineg, *lined;
 PIX       *pixg, *pixd;

     PROCNAME("pixGenerateMaskByValue");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     if (pixGetDepth(pixs) != 8)
         return (PIX *)ERROR_PTR("not 8 bpp", procName, NULL);
     if (val < 0 || val > 255)
         return (PIX *)ERROR_PTR("val out of 8 bpp range", procName, NULL);

     if (pixGetColormap(pixs))
         pixg = pixRemoveColormap(pixs, REMOVE_CMAP_TO_GRAYSCALE);
     else
         pixg = pixClone(pixs);

     pixGetDimensions(pixg, &w, &h, NULL);
     pixd = pixCreate(w, h, 1);
     pixCopyResolution(pixd, pixg);
     datag = pixGetData(pixg);
     wplg = pixGetWpl(pixg);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);
     for (i = 0; i < h; i++) {
         lineg = datag + i * wplg;
         lined = datad + i * wpld;
         for (j = 0; j < w; j++) {
             if (GET_DATA_BYTE(lineg, j) == val)
                 SET_DATA_BIT(lined, j);
         }
     }

     pixDestroy(&pixg);
     return pixd;
 }


 /*!
  *  pixGenerateMaskByBand()
  *
  *      Input:  pixs (8 bpp, or colormapped)
  *              lower, upper (two pixel values from which a range, either
  *                            between (inband) or outside of (!inband),
  *                            determines which pixels in pixs cause us to
  *                            set a 1 in the dest mask)
  *              inband (1 for finding pixels in [lower, upper];
  *                      0 for finding pixels in [0, lower) union (upper, 255])
  *      Return: pixd (1 bpp), or null on error
  *
  *  Notes:
  *      (1) Generates a 1 bpp mask pixd, the same size as pixs, where
  *          the fg pixels in the mask are those either within the specified
  *          band (for inband == 1) or outside the specified band
  *          (for inband == 0).
  *      (2) If pixs is colormapped, this first removes the colormap to
  *          generate an approximate grayscale value for each pixel, and
  *          then looks for gray pixels in or out of the given band.
  *      (3) If pixs is colormapped and you want to the band of values to
  *          select the colormap indices directly, you must first call
  *          pixDestroyColormap(pixs) to remove the colormap from pixs.
  */
 PIX *
 pixGenerateMaskByBand(PIX     *pixs,
                       l_int32  lower,
                       l_int32  upper,
                       l_int32  inband)
 {
 l_int32    i, j, w, h, wplg, wpld, val;
 l_uint32  *datag, *datad, *lineg, *lined;
 PIX       *pixg, *pixd;

     PROCNAME("pixGenerateMaskByBand");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     if (pixGetDepth(pixs) != 8)
         return (PIX *)ERROR_PTR("not 8 bpp", procName, NULL);
     if (lower < 0 || upper > 255)
         return (PIX *)ERROR_PTR("invalid lower and/or upper", procName, NULL);
     if (lower > upper)
         return (PIX *)ERROR_PTR("lower > upper!", procName, NULL);

     if (pixGetColormap(pixs))
         pixg = pixRemoveColormap(pixs, REMOVE_CMAP_TO_GRAYSCALE);
     else
         pixg = pixClone(pixs);

     pixGetDimensions(pixg, &w, &h, NULL);
     pixd = pixCreate(w, h, 1);
     pixCopyResolution(pixd, pixg);
     datag = pixGetData(pixg);
     wplg = pixGetWpl(pixg);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);
     for (i = 0; i < h; i++) {
         lineg = datag + i * wplg;
         lined = datad + i * wpld;
         for (j = 0; j < w; j++) {
             val = GET_DATA_BYTE(lineg, j);
             if (inband) {
                 if (val >= lower && val <= upper)
                     SET_DATA_BIT(lined, j);
             }
             else {  /* out of band */
                 if (val < lower || val > upper)
                     SET_DATA_BIT(lined, j);
             }
         }
     }

     pixDestroy(&pixg);
     return pixd;
 }


 /*------------------------------------------------------------------*
  *                Thresholding to 2 bpp by dithering                *
  *------------------------------------------------------------------*/
 /*!
  *  pixDitherTo2bpp()
  *
  *      Input:  pixs (8 bpp)
  *              cmapflag (1 to generate a colormap)
  *      Return: pixd (dithered 2 bpp), or null on error
  *
  *  An analog of the Floyd-Steinberg error diffusion dithering
  *  algorithm is used to "dibitize" an 8 bpp grayscale image
  *  to 2 bpp, using equally spaced gray values of 0, 85, 170, and 255,
  *  which are served by thresholds of 43, 128 and 213.
  *  If cmapflag == 1, the colormap values are set to 0, 85, 170 and 255.
  *  If a pixel has a value between 0 and 42, it is dibitized
  *  to 0, and the excess (above 0) is added to the
  *  three neighboring pixels, in the fractions 3/8 to (i, j+1),
  *  3/8 to (i+1, j) and 1/4 to (i+1, j+1), truncating to 255 if
  *  necessary.  If a pixel has a value between 43 and 127, it is
  *  dibitized to 1, and the excess (above 85) is added to the three
  *  neighboring pixels as before.  If the value is below 85, the
  *  excess is subtracted.  With a value between 128
  *  and 212, it is dibitized to 2, with the excess on either side
  *  of 170 distributed as before.  Finally, with a value between
  *  213 and 255, it is dibitized to 3, with the excess (below 255)
  *  subtracted from the neighbors.  We always truncate to 0 or 255.
  *  The details can be seen in the lookup table generation.
  *
  *  This function differs from straight dithering in that it allows
  *  clipping of grayscale to 0 or 255 if the values are
  *  sufficiently close, without distribution of the excess.
  *  This uses default values (from pix.h) to specify the range of lower
  *  and upper values (near 0 and 255, rsp) that are clipped to black
  *  and white without propagating the excess.
  *  Not propagating the excess has the effect of reducing the snake
  *  patterns in parts of the image that are nearly black or white;
  *  however, it also prevents any attempt to reproduce gray for those values.
  *
  *  The implementation uses 3 lookup tables for simplicity, and
  *  a pair of line buffers to avoid modifying pixs.
  */
 PIX *
 pixDitherTo2bpp(PIX     *pixs,
                 l_int32  cmapflag)
 {
     PROCNAME("pixDitherTo2bpp");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     if (pixGetDepth(pixs) != 8)
         return (PIX *)ERROR_PTR("must be 8 bpp for dithering", procName, NULL);

     return pixDitherTo2bppSpec(pixs, DEFAULT_CLIP_LOWER_2,
                                DEFAULT_CLIP_UPPER_2, cmapflag);
 }


 /*!
  *  pixDitherTo2bppSpec()
  *
  *      Input:  pixs (8 bpp)
  *              lowerclip (lower clip distance to black; use 0 for default)
  *              upperclip (upper clip distance to white; use 0 for default)
  *              cmapflag (1 to generate a colormap)
  *      Return: pixd (dithered 2 bpp), or null on error
  *
  *  Notes:
  *      (1) See comments above in pixDitherTo2bpp() for details.
  *      (2) The input parameters lowerclip and upperclip specify the range
  *          of lower and upper values (near 0 and 255, rsp) that are
  *          clipped to black and white without propagating the excess.
  *          For that reason, lowerclip and upperclip should be small numbers.
  */
 PIX *
 pixDitherTo2bppSpec(PIX     *pixs,
                     l_int32  lowerclip,
                     l_int32  upperclip,
                     l_int32  cmapflag)
 {
 l_int32    w, h, d, wplt, wpld;
 l_int32   *tabval, *tab38, *tab14;
 l_uint32  *datat, *datad;
 l_uint32  *bufs1, *bufs2;
 PIX       *pixt, *pixd;
 PIXCMAP   *cmap;

     PROCNAME("pixDitherTo2bppSpec");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     pixGetDimensions(pixs, &w, &h, &d);
     if (d != 8)
         return (PIX *)ERROR_PTR("must be 8 bpp for dithering", procName, NULL);
     if (lowerclip < 0 || lowerclip > 255)
         return (PIX *)ERROR_PTR("invalid value for lowerclip", procName, NULL);
     if (upperclip < 0 || upperclip > 255)
         return (PIX *)ERROR_PTR("invalid value for upperclip", procName, NULL);

     if ((pixd = pixCreate(w, h, 2)) == NULL)
         return (PIX *)ERROR_PTR("pixd not made", procName, NULL);
     pixCopyResolution(pixd, pixs);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);

         /* If there is a colormap, remove it */
     pixt = pixRemoveColormap(pixs, REMOVE_CMAP_TO_GRAYSCALE);
     datat = pixGetData(pixt);
     wplt = pixGetWpl(pixt);

         /* Two line buffers, 1 for current line and 2 for next line */
     if ((bufs1 = (l_uint32 *)CALLOC(wplt, sizeof(l_uint32))) == NULL)
         return (PIX *)ERROR_PTR("bufs1 not made", procName, NULL);
     if ((bufs2 = (l_uint32 *)CALLOC(wplt, sizeof(l_uint32))) == NULL)
         return (PIX *)ERROR_PTR("bufs2 not made", procName, NULL);

         /* 3 lookup tables: 2-bit value, (3/8)excess, and (1/4)excess */
     make8To2DitherTables(&tabval, &tab38, &tab14, lowerclip, upperclip);

     ditherTo2bppLow(datad, w, h, wpld, datat, wplt, bufs1, bufs2,
                     tabval, tab38, tab14);

     if (cmapflag) {
         cmap = pixcmapCreateLinear(2, 4);
         pixSetColormap(pixd, cmap);
     }

     FREE(bufs1);
     FREE(bufs2);
     FREE(tabval);
     FREE(tab38);
     FREE(tab14);
     pixDestroy(&pixt);

     return pixd;
 }


 /*--------------------------------------------------------------------*
  *  Simple (pixelwise) thresholding to 2 bpp with optional colormap   *
  *--------------------------------------------------------------------*/
 /*!
  *  pixThresholdTo2bpp()
  *
  *      Input:  pixs (8 bpp)
  *              nlevels (equally spaced; must be between 2 and 4)
  *              cmapflag (1 to build colormap; 0 otherwise)
  *      Return: pixd (2 bpp, optionally with colormap), or null on error
  *
  *  Notes:
  *      (1) Valid values for nlevels is the set {2, 3, 4}.
  *      (2) Any colormap on the input pixs is removed to 8 bpp grayscale.
  *      (3) This function is typically invoked with cmapflag == 1.
  *          In the situation where no colormap is desired, nlevels is
  *          ignored and pixs is thresholded to 4 levels.
  *      (4) The target output colors are equally spaced, with the
  *          darkest at 0 and the lightest at 255.  The thresholds are
  *          chosen halfway between adjacent output values.  A table
  *          is built that specifies the mapping from src to dest.
  *      (5) If cmapflag == 1, a colormap of size 'nlevels' is made,
  *          and the pixel values in pixs are replaced by their
  *          appropriate color indices.  The number of holdouts,
  *          4 - nlevels, will be between 0 and 2.
  *      (6) If you don't want the thresholding to be equally spaced,
  *          either first transform the 8 bpp src using pixGammaTRC().
  *          or, if cmapflag == 1, after calling this function you can use
  *          pixcmapResetColor() to change any individual colors.
  *      (7) If a colormap is generated, it will specify (to display
  *          programs) exactly how each level is to be represented in RGB
  *          space.  When representing text, 3 levels is far better than
  *          2 because of the antialiasing of the single gray level,
  *          and 4 levels (black, white and 2 gray levels) is getting
  *          close to the perceptual quality of a (nearly continuous)
  *          grayscale image.  With 2 bpp, you can set up a colormap
  *          and allocate from 2 to 4 levels to represent antialiased text.
  *          Any left over colormap entries can be used for coloring regions.
  *          For the same number of levels, the file size of a 2 bpp image
  *          is about 10% smaller than that of a 4 bpp result for the same
  *          number of levels.  For both 2 bpp and 4 bpp, using 4 levels you
  *          get compression far better than that of jpeg, because the
  *          quantization to 4 levels will remove the jpeg ringing in the
  *          background near character edges.
  */
 PIX *
 pixThresholdTo2bpp(PIX     *pixs,
                    l_int32  nlevels,
                    l_int32  cmapflag)
 {
 l_int32   *qtab;
 l_int32    w, h, d, wplt, wpld;
 l_uint32  *datat, *datad;
 PIX       *pixt, *pixd;
 PIXCMAP   *cmap;

     PROCNAME("pixThresholdTo2bpp");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     pixGetDimensions(pixs, &w, &h, &d);
     if (d != 8)
         return (PIX *)ERROR_PTR("pixs not 8 bpp", procName, NULL);
     if (nlevels < 2 || nlevels > 4)
         return (PIX *)ERROR_PTR("nlevels not in {2, 3, 4}", procName, NULL);

         /* Make the appropriate table */
     if (cmapflag)
         qtab = makeGrayQuantIndexTable(nlevels);
     else
         qtab = makeGrayQuantTargetTable(4, 2);

     if ((pixd = pixCreate(w, h, 2)) == NULL)
         return (PIX *)ERROR_PTR("pixd not made", procName, NULL);
     pixCopyResolution(pixd, pixs);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);

     if (cmapflag) {   /* hold out (4 - nlevels) cmap entries */
         cmap = pixcmapCreateLinear(2, nlevels);
         pixSetColormap(pixd, cmap);
     }

         /* If there is a colormap in the src, remove it */
     pixt = pixRemoveColormap(pixs, REMOVE_CMAP_TO_GRAYSCALE);
     datat = pixGetData(pixt);
     wplt = pixGetWpl(pixt);

     thresholdTo2bppLow(datad, h, wpld, datat, wplt, qtab);

     if (qtab) FREE(qtab);
     pixDestroy(&pixt);
     return pixd;
 }


 /*----------------------------------------------------------------------*
  *               Simple (pixelwise) thresholding to 4 bpp               *
  *----------------------------------------------------------------------*/
 /*!
  *  pixThresholdTo4bpp()
  *
  *      Input:  pixs (8 bpp, can have colormap)
  *              nlevels (equally spaced; must be between 2 and 16)
  *              cmapflag (1 to build colormap; 0 otherwise)
  *      Return: pixd (4 bpp, optionally with colormap), or null on error
  *
  *  Notes:
  *      (1) Valid values for nlevels is the set {2, ... 16}.
  *      (2) Any colormap on the input pixs is removed to 8 bpp grayscale.
  *      (3) This function is typically invoked with cmapflag == 1.
  *          In the situation where no colormap is desired, nlevels is
  *          ignored and pixs is thresholded to 16 levels.
  *      (4) The target output colors are equally spaced, with the
  *          darkest at 0 and the lightest at 255.  The thresholds are
  *          chosen halfway between adjacent output values.  A table
  *          is built that specifies the mapping from src to dest.
  *      (5) If cmapflag == 1, a colormap of size 'nlevels' is made,
  *          and the pixel values in pixs are replaced by their
  *          appropriate color indices.  The number of holdouts,
  *          16 - nlevels, will be between 0 and 14.
  *      (6) If you don't want the thresholding to be equally spaced,
  *          either first transform the 8 bpp src using pixGammaTRC().
  *          or, if cmapflag == 1, after calling this function you can use
  *          pixcmapResetColor() to change any individual colors.
  *      (7) If a colormap is generated, it will specify, to display
  *          programs, exactly how each level is to be represented in RGB
  *          space.  When representing text, 3 levels is far better than
  *          2 because of the antialiasing of the single gray level,
  *          and 4 levels (black, white and 2 gray levels) is getting
  *          close to the perceptual quality of a (nearly continuous)
  *          grayscale image.  Therefore, with 4 bpp, you can set up a
  *          colormap, allocate a relatively small fraction of the 16
  *          possible values to represent antialiased text, and use the
  *          other colormap entries for other things, such as coloring
  *          text or background.  Two other reasons for using a small number
  *          of gray values for antialiased text are (1) PNG compression
  *          gets worse as the number of levels that are used is increased,
  *          and (2) using a small number of levels will filter out most of
  *          the jpeg ringing that is typically introduced near sharp edges
  *          of text.  This filtering is partly responsible for the improved
  *          compression.
  */
 PIX *
 pixThresholdTo4bpp(PIX     *pixs,
                    l_int32  nlevels,
                    l_int32  cmapflag)
 {
 l_int32   *qtab;
 l_int32    w, h, d, wplt, wpld;
 l_uint32  *datat, *datad;
 PIX       *pixt, *pixd;
 PIXCMAP   *cmap;

     PROCNAME("pixThresholdTo4bpp");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     pixGetDimensions(pixs, &w, &h, &d);
     if (d != 8)
         return (PIX *)ERROR_PTR("pixs not 8 bpp", procName, NULL);
     if (nlevels < 2 || nlevels > 16)
         return (PIX *)ERROR_PTR("nlevels not in [2,...,16]", procName, NULL);

         /* Make the appropriate table */
     if (cmapflag)
         qtab = makeGrayQuantIndexTable(nlevels);
     else
         qtab = makeGrayQuantTargetTable(16, 4);

     if ((pixd = pixCreate(w, h, 4)) == NULL)
         return (PIX *)ERROR_PTR("pixd not made", procName, NULL);
     pixCopyResolution(pixd, pixs);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);

     if (cmapflag) {   /* hold out (16 - nlevels) cmap entries */
         cmap = pixcmapCreateLinear(4, nlevels);
         pixSetColormap(pixd, cmap);
     }

         /* If there is a colormap in the src, remove it */
     pixt = pixRemoveColormap(pixs, REMOVE_CMAP_TO_GRAYSCALE);
     datat = pixGetData(pixt);
     wplt = pixGetWpl(pixt);

     thresholdTo4bppLow(datad, h, wpld, datat, wplt, qtab);

     if (qtab) FREE(qtab);
     pixDestroy(&pixt);
     return pixd;
 }


 /*----------------------------------------------------------------------*
  *    Simple (pixelwise) thresholding on 8 bpp with optional colormap   *
  *----------------------------------------------------------------------*/
 /*!
  *  pixThresholdOn8bpp()
  *
  *      Input:  pixs (8 bpp, can have colormap)
  *              nlevels (equally spaced; must be between 2 and 256)
  *              cmapflag (1 to build colormap; 0 otherwise)
  *      Return: pixd (8 bpp, optionally with colormap), or null on error
  *
  *  Notes:
  *      (1) Valid values for nlevels is the set {2,...,256}.
  *      (2) Any colormap on the input pixs is removed to 8 bpp grayscale.
  *      (3) If cmapflag == 1, a colormap of size 'nlevels' is made,
  *          and the pixel values in pixs are replaced by their
  *          appropriate color indices.  Otherwise, the pixel values
  *          are the actual thresholded (i.e., quantized) grayscale values.
  *      (4) If you don't want the thresholding to be equally spaced,
  *          first transform the input 8 bpp src using pixGammaTRC().
  */
 PIX *
 pixThresholdOn8bpp(PIX     *pixs,
                    l_int32  nlevels,
                    l_int32  cmapflag)
 {
 l_int32   *qtab;  /* quantization table */
 l_int32    i, j, w, h, wpld, val, newval;
 l_uint32  *datad, *lined;
 PIX       *pixd;
 PIXCMAP   *cmap;

     PROCNAME("pixThresholdOn8bpp");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     if (pixGetDepth(pixs) != 8)
         return (PIX *)ERROR_PTR("pixs not 8 bpp", procName, NULL);
     if (nlevels < 2 || nlevels > 256)
         return (PIX *)ERROR_PTR("nlevels not in [2,...,256]", procName, NULL);

     if (cmapflag)
         qtab = makeGrayQuantIndexTable(nlevels);
     else
         qtab = makeGrayQuantTargetTable(nlevels, 8);

         /* Get a new pixd; if there is a colormap in the src, remove it */
     if (pixGetColormap(pixs))
         pixd = pixRemoveColormap(pixs, REMOVE_CMAP_TO_GRAYSCALE);
     else
         pixd = pixCopy(NULL, pixs);

     if (cmapflag) {   /* hold out (256 - nlevels) cmap entries */
         cmap = pixcmapCreateLinear(8, nlevels);
         pixSetColormap(pixd, cmap);
     }

     pixGetDimensions(pixd, &w, &h, NULL);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);
     for (i = 0; i < h; i++) {
         lined = datad + i * wpld;
         for (j = 0; j < w; j++) {
             val = GET_DATA_BYTE(lined, j);
             newval = qtab[val];
             SET_DATA_BYTE(lined, j, newval);
         }
     }

     if (qtab) FREE(qtab);
     return pixd;
 }


 /*----------------------------------------------------------------------*
  *    Arbitrary (pixelwise) thresholding from 8 bpp to 2, 4 or 8 bpp    *
  *----------------------------------------------------------------------*/
 /*!
  *  pixThresholdGrayArb()
  *
  *      Input:  pixs (8 bpp grayscale; can have colormap)
  *              edgevals (string giving edge value of each bin)
  *              outdepth (0, 2, 4 or 8 bpp; 0 is default for min depth)
  *              use_average (1 if use the average pixel value in colormap)
  *              setblack (1 if darkest color is set to black)
  *              setwhite (1 if lightest color is set to white)
  *      Return: pixd (2, 4 or 8 bpp quantized image with colormap),
  *                    or null on error
  *
  *  Notes:
  *      (1) This function allows exact specification of the quantization bins.
  *          The string @edgevals is a space-separated set of values
  *          specifying the dividing points between output quantization bins.
  *          These threshold values are assigned to the bin with higher
  *          values, so that each of them is the smallest value in their bin.
  *      (2) The output image (pixd) depth is specified by @outdepth.  The
  *          number of bins is the number of edgevals + 1.  The
  *          relation between outdepth and the number of bins is:
  *               outdepth = 2       nbins <= 4
  *               outdepth = 4       nbins <= 16
  *               outdepth = 8       nbins <= 256
  *          With @outdepth == 0, the minimum required depth for the
  *          given number of bins is used.
  *          The output pixd has a colormap.
  *      (3) The last 3 args determine the specific values that go into
  *          the colormap.
  *      (4) For @use_average:
  *            - if TRUE, the average value of pixels falling in the bin is
  *              chosen as the representative gray value.  Otherwise,
  *            - if FALSE, the central value of each bin is chosen as
  *              the representative value.
  *          The colormap holds the representative value.
  *      (5) For @setblack, if TRUE the darkest color is set to (0,0,0).
  *      (6) For @setwhite, if TRUE the lightest color is set to (255,255,255).
  *      (7) An alternative to using this function to quantize to
  *          unequally-spaced bins is to first transform the 8 bpp pixs
  *          using pixGammaTRC(), and follow this with pixThresholdTo4bpp().
  */
 PIX *
 pixThresholdGrayArb(PIX         *pixs,
                     const char  *edgevals,
                     l_int32      outdepth,
                     l_int32      use_average,
                     l_int32      setblack,
                     l_int32      setwhite)
 {
 l_int32   *qtab;
 l_int32    w, h, d, i, j, n, wplt, wpld, val, newval;
 l_uint32  *datat, *datad, *linet, *lined;
 NUMA      *na;
 PIX       *pixt, *pixd;
 PIXCMAP   *cmap;

     PROCNAME("pixThresholdGrayArb");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     pixGetDimensions(pixs, &w, &h, &d);
     if (d != 8)
         return (PIX *)ERROR_PTR("pixs not 8 bpp", procName, NULL);
     if (!edgevals)
         return (PIX *)ERROR_PTR("edgevals not defined", procName, NULL);
     if (outdepth != 0 && outdepth != 2 && outdepth != 4 && outdepth != 8)
         return (PIX *)ERROR_PTR("invalid outdepth", procName, NULL);

         /* Parse and sort (if required) the bin edge values */
     na = parseStringForNumbers(edgevals, " \t\n,");
     n = numaGetCount(na);
     if (n > 255)
         return (PIX *)ERROR_PTR("more than 256 levels", procName, NULL);
     if (outdepth == 0) {
         if (n <= 3)
             outdepth = 2;
         else if (n <= 15)
             outdepth = 4;
         else
             outdepth = 8;
     }
     else if (n + 1 > (1 << outdepth)) {
         L_WARNING("outdepth too small; setting to 8 bpp", procName);
         outdepth = 8;
     }
     numaSort(na, na, L_SORT_INCREASING);

         /* Make the quantization LUT and the colormap */
     makeGrayQuantTableArb(na, outdepth, &qtab, &cmap);
     if (use_average) {  /* use the average value in each bin */
         pixcmapDestroy(&cmap);
 	makeGrayQuantColormapArb(pixs, qtab, outdepth, &cmap);
     }
     pixcmapSetBlackAndWhite(cmap, setblack, setwhite);
     numaDestroy(&na);

     if ((pixd = pixCreate(w, h, outdepth)) == NULL)
         return (PIX *)ERROR_PTR("pixd not made", procName, NULL);
     pixCopyResolution(pixd, pixs);
     pixSetColormap(pixd, cmap);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);

         /* If there is a colormap in the src, remove it */
     pixt = pixRemoveColormap(pixs, REMOVE_CMAP_TO_GRAYSCALE);
     datat = pixGetData(pixt);
     wplt = pixGetWpl(pixt);

     if (outdepth == 2)
         thresholdTo2bppLow(datad, h, wpld, datat, wplt, qtab);
     else if (outdepth == 4)
         thresholdTo4bppLow(datad, h, wpld, datat, wplt, qtab);
     else {
         for (i = 0; i < h; i++) {
             lined = datad + i * wpld;
             linet = datat + i * wplt;
             for (j = 0; j < w; j++) {
                 val = GET_DATA_BYTE(linet, j);
                 newval = qtab[val];
                 SET_DATA_BYTE(lined, j, newval);
             }
         }
     }

     FREE(qtab);
     pixDestroy(&pixt);
     return pixd;
 }


 /*----------------------------------------------------------------------*
  *     Quantization tables for linear thresholds of grayscale images    *
  *----------------------------------------------------------------------*/
 /*!
  *  makeGrayQuantIndexTable()
  *
  *      Input:  nlevels (number of output levels)
  *      Return: table (maps input gray level to colormap index,
  *                     or null on error)
  *  Notes:
  *      (1) 'nlevels' is some number between 2 and 256 (typically 8 or less).
  *      (2) The table is typically used for quantizing 2, 4 and 8 bpp
  *          grayscale src pix, and generating a colormapped dest pix.
  */
 l_int32 *
 makeGrayQuantIndexTable(l_int32  nlevels)
 {
 l_int32   *tab;
 l_int32    i, j, thresh;

     PROCNAME("makeGrayQuantIndexTable");

     if ((tab = (l_int32 *)CALLOC(256, sizeof(l_int32))) == NULL)
         return (l_int32 *)ERROR_PTR("calloc fail for tab", procName, NULL);
     for (i = 0; i < 256; i++) {
         for (j = 0; j < nlevels; j++) {
             thresh = 255 * (2 * j + 1) / (2 * nlevels - 2);
             if (i <= thresh) {
                 tab[i] = j;
 /*                fprintf(stderr, "tab[%d] = %d\n", i, j); */
                 break;
             }
         }
     }
     return tab;
 }


 /*!
  *  makeGrayQuantTargetTable()
  *
  *      Input:  nlevels (number of output levels)
  *              depth (of dest pix, in bpp; 2, 4 or 8 bpp)
  *      Return: table (maps input gray level to thresholded gray level,
  *                     or null on error)
  *
  *  Notes:
  *      (1) nlevels is some number between 2 and 2^(depth)
  *      (2) The table is used in two similar ways:
  *           - for 8 bpp, it quantizes to a given number of target levels
  *           - for 2 and 4 bpp, it thresholds to appropriate target values
  *             that will use the full dynamic range of the dest pix.
  *      (3) For depth = 8, the number of thresholds chosen is
  *          ('nlevels' - 1), and the 'nlevels' values stored in the
  *          table are at the two at the extreme ends, (0, 255), plus
  *          plus ('nlevels' - 2) values chosen at equal intervals between.
  *          For example, for depth = 8 and 'nlevels' = 3, the two
  *          threshold values are 3f and bf, and the three target pixel
  *          values are 0, 7f and ff.
  *      (4) For depth < 8, we ignore nlevels, and always use the maximum
  *          number of levels, which is 2^(depth).
  *          If you want nlevels < the maximum number, you should always
  *          use a colormap.
  */
 l_int32 *
 makeGrayQuantTargetTable(l_int32  nlevels,
                          l_int32  depth)
 {
 l_int32   *tab;
 l_int32    i, j, thresh, maxval, quantval;

     PROCNAME("makeGrayQuantTargetTable");

     if ((tab = (l_int32 *)CALLOC(256, sizeof(l_int32))) == NULL)
         return (l_int32 *)ERROR_PTR("calloc fail for tab", procName, NULL);
     maxval = (1 << depth) - 1;
     if (depth < 8)
         nlevels = 1 << depth;
     for (i = 0; i < 256; i++) {
         for (j = 0; j < nlevels; j++) {
             thresh = 255 * (2 * j + 1) / (2 * nlevels - 2);
             if (i <= thresh) {
                 quantval = maxval * j / (nlevels - 1);
                 tab[i] = quantval;
 /*                fprintf(stderr, "tab[%d] = %d\n", i, tab[i]); */
                 break;
             }
         }
     }
     return tab;
 }


 /*----------------------------------------------------------------------*
  *   Quantization table for arbitrary thresholding of grayscale images  *
  *----------------------------------------------------------------------*/
 /*!
  *  makeGrayQuantTableArb()
  *
  *      Input:  na (numa of bin boundaries)
  *              outdepth (of colormap: 1, 2, 4 or 8)
  *              &tab (<return> table mapping input gray level to cmap index)
  *              &cmap (<return> colormap)
  *      Return: 0 if OK, 1 on error
  *
  *  Notes:
  *      (1) The number of bins is the count of @na + 1.
  *      (2) The bin boundaries in na must be sorted in increasing order.
  *      (3) The table is an inverse colormap: it maps input gray level
  *          to colormap index (the bin number).
  *      (4) The colormap generated here has quantized values at the
  *          center of each bin.  If you want to use the average gray
  *          value of pixels within the bin, discard the colormap and
  *          compute it using makeGrayQuantColormapArb().
  *      (5) Returns an error if there are not enough levels in the
  *          output colormap for the number of bins.  The number
  *          of bins must not exceed 2^outdepth.
  */
 l_int32
 makeGrayQuantTableArb(NUMA      *na,
                       l_int32    outdepth,
                       l_int32  **ptab,
                       PIXCMAP  **pcmap)
 {
 l_int32   i, j, n, jstart, ave, val;
 l_int32  *tab;
 PIXCMAP  *cmap;

     PROCNAME("makeGrayQuantTableArb");

     if (!ptab)
         return ERROR_INT("&tab not defined", procName, 1);
     *ptab = NULL;
     if (!pcmap)
         return ERROR_INT("&cmap not defined", procName, 1);
     *pcmap = NULL;
     if (!na)
         return ERROR_INT("na not defined", procName, 1);
     n = numaGetCount(na);
     if (n + 1 > (1 << outdepth))
         return ERROR_INT("more bins than cmap levels", procName, 1);

     if ((tab = (l_int32 *)CALLOC(256, sizeof(l_int32))) == NULL)
         return ERROR_INT("calloc fail for tab", procName, 1);
     if ((cmap = pixcmapCreate(outdepth)) == NULL)
         return ERROR_INT("cmap not made", procName, 1);
     *ptab = tab;
     *pcmap = cmap;

         /* First n bins */
     jstart = 0;
     for (i = 0; i < n; i++) {
         numaGetIValue(na, i, &val);
         ave = (jstart + val) / 2;
         pixcmapAddColor(cmap, ave, ave, ave);
         for (j = jstart; j < val; j++)
             tab[j] = i;
         jstart = val;
     }

         /* Last bin */
     ave = (jstart + 255) / 2;
     pixcmapAddColor(cmap, ave, ave, ave);
     for (j = jstart; j < 256; j++)
         tab[j] = n;

     return 0;
 }


 /*!
  *  makeGrayQuantColormapArb()
  *
  *      Input:  pixs (8 bpp)
  *              tab (table mapping input gray level to cmap index)
  *              outdepth (of colormap: 1, 2, 4 or 8)
  *              &cmap (<return> colormap)
  *      Return: 0 if OK, 1 on error
  *
  *  Notes:
  *      (1) The table is a 256-entry inverse colormap: it maps input gray
  *          level to colormap index (the bin number).  It is computed
  *          using makeGrayQuantTableArb().
  *      (2) The colormap generated here has quantized values at the
  *          average gray value of the pixels that are in each bin.
  *      (3) Returns an error if there are not enough levels in the
  *          output colormap for the number of bins.  The number
  *          of bins must not exceed 2^outdepth.
  */
 l_int32
 makeGrayQuantColormapArb(PIX       *pixs,
                          l_int32   *tab,
                          l_int32    outdepth,
                          PIXCMAP  **pcmap)
 {
 l_int32    i, j, index, w, h, d, nbins, wpl, factor, val;
 l_int32   *bincount, *binave, *binstart;
 l_uint32  *line, *data;

     PROCNAME("makeGrayQuantColormapArb");

     if (!pcmap)
         return ERROR_INT("&cmap not defined", procName, 1);
     *pcmap = NULL;
     if (!pixs)
         return ERROR_INT("pixs not defined", procName, 1);
     pixGetDimensions(pixs, &w, &h, &d);
     if (d != 8)
         return ERROR_INT("pixs not 8 bpp", procName, 1);
     if (!tab)
         return ERROR_INT("tab not defined", procName, 1);
     nbins = tab[255] + 1;
     if (nbins > (1 << outdepth))
         return ERROR_INT("more bins than cmap levels", procName, 1);

         /* Find the count and weighted count for each bin */
     if ((bincount = (l_int32 *)CALLOC(nbins, sizeof(l_int32))) == NULL)
         return ERROR_INT("calloc fail for bincount", procName, 1);
     if ((binave = (l_int32 *)CALLOC(nbins, sizeof(l_int32))) == NULL)
         return ERROR_INT("calloc fail for binave", procName, 1);
     factor = (l_int32)(sqrt((l_float64)(w * h) / 30000.) + 0.5);
     factor = L_MAX(1, factor);
     data = pixGetData(pixs);
     wpl = pixGetWpl(pixs);
     for (i = 0; i < h; i += factor) {
         line = data + i * wpl;
         for (j = 0; j < w; j += factor) {
             val = GET_DATA_BYTE(line, j);
             bincount[tab[val]]++;
             binave[tab[val]] += val;
         }
     }

         /* Find the smallest gray values in each bin */
     if ((binstart = (l_int32 *)CALLOC(nbins, sizeof(l_int32))) == NULL)
         return ERROR_INT("calloc fail for binstart", procName, 1);
     for (i = 1, index = 1; i < 256; i++) {
         if (tab[i] < index) continue;
         if (tab[i] == index)
             binstart[index++] = i;
     }

         /* Get the averages.  If there are no samples in a bin, use
 	 * the center value of the bin. */
     *pcmap = pixcmapCreate(outdepth);
     for (i = 0; i < nbins; i++) {
         if (bincount[i])
             val = binave[i] / bincount[i];
         else {  /* no samples in the bin */
             if (i < nbins - 1)
                 val = (binstart[i] + binstart[i + 1]) / 2;
             else  /* last bin */
                 val = (binstart[i] + 255) / 2;
         }
         pixcmapAddColor(*pcmap, val, val, val);
     }

     FREE(bincount);
     FREE(binave);
     FREE(binstart);
     return 0;
 }


 /*--------------------------------------------------------------------*
  *                 Thresholding from 32 bpp rgb to 1 bpp              *
  *--------------------------------------------------------------------*/
 /*!
  *  pixGenerateMaskByBand32()
  *
  *      Input:  pixs (32 bpp)
  *              refval (reference rgb value)
  *              delm (max amount below the ref value for any component)
  *              delp (max amount above the ref value for any component)
  *      Return: pixd (1 bpp), or null on error
  *
  *  Notes:
  *      (1) Generates a 1 bpp mask pixd, the same size as pixs, where
  *          the fg pixels in the mask are those where each component
  *          is within -delm to +delp of the reference value.
  */
 PIX *
 pixGenerateMaskByBand32(PIX    *pixs,
                         l_uint32  refval,
                         l_int32   delm,
                         l_int32   delp)
 {
 l_int32    i, j, w, h, d, wpls, wpld;
 l_int32    rref, gref, bref, rval, gval, bval;
 l_uint32   pixel;
 l_uint32  *datas, *datad, *lines, *lined;
 PIX       *pixd;

     PROCNAME("pixGenerateMaskByBand32");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     pixGetDimensions(pixs, &w, &h, &d);
     if (d != 32)
         return (PIX *)ERROR_PTR("not 32 bpp", procName, NULL);
     if (delm < 0 || delp < 0)
         return (PIX *)ERROR_PTR("delm and delp must be >= 0", procName, NULL);

     extractRGBValues(refval, &rref, &gref, &bref);
     pixd = pixCreate(w, h, 1);
     pixCopyResolution(pixd, pixs);
     datas = pixGetData(pixs);
     wpls = pixGetWpl(pixs);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);
     for (i = 0; i < h; i++) {
         lines = datas + i * wpls;
         lined = datad + i * wpld;
         for (j = 0; j < w; j++) {
             pixel = lines[j];
             rval = (pixel >> L_RED_SHIFT) & 0xff;
             if (rval < rref - delm || rval > rref + delp)
                 continue;
             gval = (pixel >> L_GREEN_SHIFT) & 0xff;
             if (gval < gref - delm || gval > gref + delp)
                 continue;
             bval = (pixel >> L_BLUE_SHIFT) & 0xff;
             if (bval < bref - delm || bval > bref + delp)
                 continue;
             SET_DATA_BIT(lined, j);
         }
     }

     return pixd;
 }


 /*!
  *  pixGenerateMaskByDiscr32()
  *
  *      Input:  pixs (32 bpp)
  *              refval1 (reference rgb value)
  *              refval2 (reference rgb value)
  *              distflag (L_MANHATTAN_DISTANCE, L_EUCLIDEAN_DISTANCE)
  *      Return: pixd (1 bpp), or null on error
  *
  *  Notes:
  *      (1) Generates a 1 bpp mask pixd, the same size as pixs, where
  *          the fg pixels in the mask are those where the pixel in pixs
  *          is "closer" to refval1 than to refval2.
  *      (2) "Closer" can be defined in several ways, such as:
  *            - manhattan distance (L1)
  *            - euclidean distance (L2)
  *            - majority vote of the individual components
  *          Here, we have a choice of L1 or L2.
  */
 PIX *
 pixGenerateMaskByDiscr32(PIX      *pixs,
                          l_uint32  refval1,
                          l_uint32  refval2,
 			 l_int32   distflag)
 {
 l_int32    i, j, w, h, d, wpls, wpld;
 l_int32    rref1, gref1, bref1, rref2, gref2, bref2, rval, gval, bval;
 l_uint32   pixel, dist1, dist2;
 l_uint32  *datas, *datad, *lines, *lined;
 PIX       *pixd;

     PROCNAME("pixGenerateMaskByDiscr32");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     pixGetDimensions(pixs, &w, &h, &d);
     if (d != 32)
         return (PIX *)ERROR_PTR("not 32 bpp", procName, NULL);
     if (distflag != L_MANHATTAN_DISTANCE && distflag != L_EUCLIDEAN_DISTANCE)
         return (PIX *)ERROR_PTR("invalid distflag", procName, NULL);

     extractRGBValues(refval1, &rref1, &gref1, &bref1);
     extractRGBValues(refval2, &rref2, &gref2, &bref2);
     pixd = pixCreate(w, h, 1);
     pixCopyResolution(pixd, pixs);
     datas = pixGetData(pixs);
     wpls = pixGetWpl(pixs);
     datad = pixGetData(pixd);
     wpld = pixGetWpl(pixd);
     for (i = 0; i < h; i++) {
         lines = datas + i * wpls;
         lined = datad + i * wpld;
         for (j = 0; j < w; j++) {
             pixel = lines[j];
             extractRGBValues(pixel, &rval, &gval, &bval);
             if (distflag == L_MANHATTAN_DISTANCE) {
                 dist1 = L_ABS(rref1 - rval);
                 dist2 = L_ABS(rref2 - rval);
                 dist1 += L_ABS(gref1 - gval);
                 dist2 += L_ABS(gref2 - gval);
                 dist1 += L_ABS(bref1 - bval);
                 dist2 += L_ABS(bref2 - bval);
             }
             else {
                 dist1 = (rref1 - rval) * (rref1 - rval);
                 dist2 = (rref2 - rval) * (rref2 - rval);
                 dist1 += (gref1 - gval) * (gref1 - gval);
                 dist2 += (gref2 - gval) * (gref2 - gval);
                 dist1 += (bref1 - bval) * (bref1 - bval);
                 dist2 += (bref2 - bval) * (bref2 - bval);
             }
             if (dist1 < dist2)
                 SET_DATA_BIT(lined, j);
         }
     }

     return pixd;
 }


 /*----------------------------------------------------------------------*
  *                Histogram-based grayscale quantization                *
  *----------------------------------------------------------------------*/
 /*!
  *  pixGrayQuantFromHisto()
  *
  *      Input:  pixd (<optional> quantized pix with cmap; can be null)
  *              pixs (8 bpp gray input pix; not cmapped)
  *              pixm (<optional> mask over pixels in pixs to quantize)
  *              minfract (minimum fraction of pixels in a set of adjacent
  *                        histo bins that causes the set to be automatically
  *                        set aside as a color in the colormap; must be
  *                        at least 0.01)
  *              maxsize (maximum number of adjacent bins allowed to represent
  *                       a color, regardless of the population of pixels
  *                       in the bins; must be at least 2)
  *      Return: pixd (8 bpp, cmapped), or null on error
  *
  *  Notes:
  *      (1) This is useful for quantizing images with relatively few
  *          colors, but which may have both color and gray pixels.
  *          If there are color pixels, it is assumed that an input
  *          rgb image has been color quantized first so that:
  *            - pixd has a colormap describing the color pixels
  *            - pixm is a mask over the non-color pixels in pixd
  *            - the colormap in pixd, and the color pixels in pixd,
  *              have been repacked to go from 0 to n-1 (n colors)
  *          If there are no color pixels, pixd and pixm are both null,
  *          and all pixels in pixs are quantized to gray.
  *      (2) A 256-entry histogram is built of the gray values in pixs.
  *          If pixm exists, the pixels contributing to the histogram are
  *          restricted to the fg of pixm.  A colormap and LUT are generated
  *          from this histogram.  We break up the array into a set
  *          of intervals, each one constituting a color in the colormap:
  *          An interval is identified by summing histogram bins until
  *          either the sum equals or exceeds the @minfract of the total
  *          number of pixels, or the span itself equals or exceeds @maxsize.
  *          The color of each bin is always an average of the pixels
  *          that constitute it.
  *      (3) Note that we do not specify the number of gray colors in
  *          the colormap.  Instead, we specify two parameters that
  *          describe the accuracy of the color assignments; this and
  *          the actual image determine the number of resulting colors.
  *      (4) If a mask exists and it is not the same size as pixs, make
  *          a new mask the same size as pixs, with the original mask
  *          aligned at the UL corners.  Set all additional pixels
  *          in the (larger) new mask set to 1, causing those pixels
  *          in pixd to be set as gray.
  *      (5) We estimate the total number of colors (color plus gray);
  *          if it exceeds 255, return null.
  */
 PIX *
 pixGrayQuantFromHisto(PIX       *pixd,
                       PIX       *pixs,
                       PIX       *pixm,
                       l_float32  minfract,
                       l_int32    maxsize)
 {
 l_int32    w, h, wd, hd, wm, hm, wpls, wplm, wpld;
 l_int32    nc, nestim, i, j, vals, vald;
 l_int32   *lut;
 l_uint32  *datas, *datam, *datad, *lines, *linem, *lined;
 NUMA      *na;
 PIX       *pixmr;  /* resized mask */
 PIXCMAP   *cmap;

     PROCNAME("pixGrayQuantFromHisto");

     if (!pixs || pixGetDepth(pixs) != 8)
         return (PIX *)ERROR_PTR("pixs undefined or not 8 bpp", procName, NULL);
     if (minfract < 0.01) {
         L_WARNING("minfract < 0.01; setting to 0.05", procName);
         minfract = 0.05;
     }
     if (maxsize < 2) {
         L_WARNING("maxsize < 2; setting to 10", procName);
         maxsize = 10;
     }
     if ((pixd && !pixm) || (!pixd && pixm))
         return (PIX *)ERROR_PTR("(pixd,pixm) not defined together",
                                 procName, NULL);
     pixGetDimensions(pixs, &w, &h, NULL);
     if (pixd) {
         if (pixGetDepth(pixm) != 1)
             return (PIX *)ERROR_PTR("pixm not 1 bpp", procName, NULL);
         if ((cmap = pixGetColormap(pixd)) == NULL)
             return (PIX *)ERROR_PTR("pixd not cmapped", procName, NULL);
         pixGetDimensions(pixd, &wd, &hd, NULL);
         if (w != wd || h != hd)
             return (PIX *)ERROR_PTR("pixs, pixd sizes differ", procName, NULL);
         nc = pixcmapGetCount(cmap);
         nestim = nc + (l_int32)(1.5 * 255 / maxsize);
         fprintf(stderr, "nestim = %d\n", nestim);
         if (nestim > 255) {
             L_ERROR_INT("Estimate %d colors!", procName, nestim);
             return (PIX *)ERROR_PTR("probably too many colors", procName, NULL);
         }
         pixGetDimensions(pixm, &wm, &hm, NULL);
         if (w != wm || h != hm) {  /* resize the mask */
             L_WARNING("mask and dest sizes not equal", procName);
             pixmr = pixCreateNoInit(w, h, 1);
             pixRasterop(pixmr, 0, 0, wm, hm, PIX_SRC, pixm, 0, 0);
             pixRasterop(pixmr, wm, 0, w - wm, h, PIX_SET, NULL, 0, 0);
             pixRasterop(pixmr, 0, hm, wm, h - hm, PIX_SET, NULL, 0, 0);
         }
         else
             pixmr = pixClone(pixm);
     }
     else {
         pixd = pixCreateTemplate(pixs);
         cmap = pixcmapCreate(8);
         pixSetColormap(pixd, cmap);
     }

         /* Use original mask, if it exists, to select gray pixels */
     na = pixGetGrayHistogramMasked(pixs, pixm, 0, 0, 1);

         /* Fill out the cmap with gray colors, and generate the lut
          * for pixel assignment.  Issue a warning on failure.  */
     if (numaFillCmapFromHisto(na, cmap, minfract, maxsize, &lut))
         L_ERROR("ran out of colors in cmap!", procName);
     numaDestroy(&na);

         /* Assign the gray pixels to their cmap indices */
     datas = pixGetData(pixs);
     datad = pixGetData(pixd);
     wpls = pixGetWpl(pixs);
     wpld = pixGetWpl(pixd);
     if (!pixm) {
         for (i = 0; i < h; i++) {
             lines = datas + i * wpls;
             lined = datad + i * wpld;
             for (j = 0; j < w; j++) {
                 vals = GET_DATA_BYTE(lines, j);
                 vald = lut[vals];
                 SET_DATA_BYTE(lined, j, vald);
             }
         }
         FREE(lut);
         return pixd;
     }

     datam = pixGetData(pixmr);
     wplm = pixGetWpl(pixmr);
     for (i = 0; i < h; i++) {
         lines = datas + i * wpls;
         linem = datam + i * wplm;
         lined = datad + i * wpld;
         for (j = 0; j < w; j++) {
             if (!GET_DATA_BIT(linem, j))
                 continue;
             vals = GET_DATA_BYTE(lines, j);
             vald = lut[vals];
             SET_DATA_BYTE(lined, j, vald);
         }
     }
     pixDestroy(&pixmr);
     FREE(lut);
     return pixd;
 }


 /*!
  *  numaFillCmapFromHisto()
  *
  *      Input:  na (histogram of gray values)
  *              cmap (8 bpp cmap, possibly initialized with color value)
  *              minfract (minimum fraction of pixels in a set of adjacent
  *                        histo bins that causes the set to be automatically
  *                        set aside as a color in the colormap; must be
  *                        at least 0.01)
  *              maxsize (maximum number of adjacent bins allowed to represent
  *                       a color, regardless of the population of pixels
  *                       in the bins; must be at least 2)
  *             &lut (<return> lookup table from gray value to colormap index)
  *      Return: 0 if OK, 1 on error
  *
  *  Notes:
  *      (1) This static function must be called from pixGrayQuantFromHisto()
  */
 static l_int32
 numaFillCmapFromHisto(NUMA      *na,
                       PIXCMAP   *cmap,
                       l_float32  minfract,
                       l_int32    maxsize,
                       l_int32  **plut)
 {
 l_int32    mincount, index, sum, wtsum, span, istart, i, val, ret;
 l_int32   *iahisto, *lut;
 l_float32  total;

     PROCNAME("numaFillCmapFromHisto");

     if (!plut)
         return ERROR_INT("&lut not defined", procName, 1);
     *plut = NULL;
     if (!na)
         return ERROR_INT("na not defined", procName, 1);
     if (!cmap)
         return ERROR_INT("cmap not defined", procName, 1);

     numaGetSum(na, &total);
     mincount = (l_int32)(minfract * total);
     iahisto = numaGetIArray(na);
     if ((lut = (l_int32 *)CALLOC(256, sizeof(l_int32))) == NULL)
         return ERROR_INT("lut not made", procName, 1);
     *plut = lut;
     index = pixcmapGetCount(cmap);  /* start with number of colors
                                      * already reserved */

         /* March through, associating colors with sets of adjacent
          * gray levels.  During the process, the LUT that gives
          * the colormap index for each gray level is computed.
          * To complete a color, either the total count must equal
          * or exceed @mincount, or the current span of colors must
          * equal or exceed @maxsize.  An empty span is not converted
          * into a color; it is simply ignored.  When a span is completed for a
          * color, the weighted color in the span is added to the colormap. */
     sum = 0;
     wtsum = 0;
     istart = 0;
     ret = 0;
     for (i = 0; i < 256; i++) {
         lut[i] = index;
         sum += iahisto[i];
         wtsum += i * iahisto[i];
         span = i - istart + 1;
         if (sum < mincount && span < maxsize)
             continue;

         if (sum == 0) {  /* empty span; don't save */
             istart = i + 1;
             continue;
         }

             /* Found new color; sum > 0 */
         val = (l_int32)((l_float32)wtsum / (l_float32)sum + 0.5);
         ret = pixcmapAddColor(cmap, val, val, val);
         istart = i + 1;
         sum = 0;
         wtsum = 0;
         index++;
     }
     if (istart < 256 && sum > 0) {  /* last one */
         span = 256 - istart;
         val = (l_int32)((l_float32)wtsum / (l_float32)sum + 0.5);
         ret = pixcmapAddColor(cmap, val, val, val);
     }

     FREE(iahisto);
     return ret;
 }


 /*----------------------------------------------------------------------*
  *        Color quantize grayscale image using existing colormap        *
  *----------------------------------------------------------------------*/
 /*!
  *  pixGrayQuantFromCmap()
  *
  *      Input:  pixs (8 bpp grayscale without cmap)
  *              cmap (to quantize to; of dest pix)
  *              mindepth (minimum depth of pixd: can be 2, 4 or 8 bpp)
  *      Return: pixd (2, 4 or 8 bpp, colormapped), or null on error
  *
  *  Notes:
  *      (1) In use, pixs is an 8 bpp grayscale image without a colormap.
  *          If there is an existing colormap, a warning is issued and
  *          a copy of the input pixs is returned.
  */
 PIX *
 pixGrayQuantFromCmap(PIX      *pixs,
                      PIXCMAP  *cmap,
                      l_int32   mindepth)
 {
 l_int32    i, j, index, w, h, d, depth, wpls, wpld;
 l_int32    hascolor, vals, vald;
 l_int32   *tab;
 l_uint32  *datas, *datad, *lines, *lined;
 PIXCMAP   *cmapd;
 PIX       *pixd;

     PROCNAME("pixGrayQuantFromCmap");

     if (!pixs)
         return (PIX *)ERROR_PTR("pixs not defined", procName, NULL);
     if (pixGetColormap(pixs) != NULL) {
         L_WARNING("pixs already has a colormap; returning a copy", procName);
         return pixCopy(NULL, pixs);
     }
     pixGetDimensions(pixs, &w, &h, &d);
     if (d != 8)
         return (PIX *)ERROR_PTR("pixs not 8 bpp", procName, NULL);
     if (!cmap)
         return (PIX *)ERROR_PTR("cmap not defined", procName, NULL);
     if (mindepth != 2 && mindepth != 4 && mindepth != 8)
         return (PIX *)ERROR_PTR("invalid mindepth", procName, NULL);

         /* Make sure the colormap is gray */
     pixcmapHasColor(cmap, &hascolor);
     if (hascolor) {
         L_WARNING("Converting colormap colors to gray", procName);
         cmapd = pixcmapColorToGray(cmap, 0.3, 0.5, 0.2);
     }
     else
         cmapd = pixcmapCopy(cmap);

         /* Make LUT into colormap */
     if ((tab = (l_int32 *)CALLOC(256, sizeof(l_int32))) == NULL)
         return (PIX *)ERROR_PTR("tab not made", procName, NULL);
     for (i = 0; i < 256; i++) {
         pixcmapGetNearestGrayIndex(cmapd, i, &index);
         tab[i] = index;
     }

     pixcmapGetMinDepth(cmap, &depth);
     depth = L_MAX(depth, mindepth);
     pixd = pixCreate(w, h, depth);
     pixSetColormap(pixd, cmapd);
     pixCopyResolution(pixd, pixs);
     pixCopyInputFormat(pixd, pixs);
     datas = pixGetData(pixs);
     datad = pixGetData(pixd);
     wpls = pixGetWpl(pixs);
     wpld = pixGetWpl(pixd);
     for (i = 0; i < h; i++) {
         lines = datas + i * wpls;
         lined = datad + i * wpld;
         for (j = 0; j < w; j++) {
             vals = GET_DATA_BYTE(lines, j);
             vald = tab[vals];
             if (depth == 2)
                 SET_DATA_DIBIT(lined, j, vald);
             else if (depth == 4)
                 SET_DATA_QBIT(lined, j, vald);
             else  /* depth == 8 */
                 SET_DATA_BYTE(lined, j, vald);
         }
     }

     FREE(tab);
     return pixd;
 }