/*====================================================================* - Copyright (C) 2001 Leptonica. All rights reserved. - - Redistribution and use in source and binary forms, with or without - modification, are permitted provided that the following conditions - are met: - 1. Redistributions of source code must retain the above copyright - notice, this list of conditions and the following disclaimer. - 2. Redistributions in binary form must reproduce the above - copyright notice, this list of conditions and the following - disclaimer in the documentation and/or other materials - provided with the distribution. - - THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS - ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT - LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR - A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL ANY - CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, - EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, - PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR - PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY - OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING - NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS - SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. *====================================================================*/ /* * pageseg_reg.c * * This is a regresssion test for some of the page segmentation * algorithms. You can run some of these algorithms on any selected page * image using prog/pagesegtest1. * Tests are for: * - Generic page segmentation * - Foreground finding * - Greedy whitespace rectangle finder * - Table finder * - Text auto-inversion */ #ifdef HAVE_CONFIG_H #include #endif /* HAVE_CONFIG_H */ #include "allheaders.h" int main(int argc, char **argv) { l_uint8 *data; char *fname; l_int32 i, n, w, h, istable, score; size_t size; BOX *box; BOXA *boxa; PIX *pixs, *pix1, *pix2, *pix3, *pix4, *pix5; PIX *pixhm, *pixtm, *pixtb, *pixdb; PIXA *pixadb; PIXAC *pixac; SARRAY *sa; L_REGPARAMS *rp; #if !defined(HAVE_LIBPNG) L_ERROR("This test requires libpng to run.\n", "pageseg_reg"); exit(77); #endif #if !defined(HAVE_LIBJPEG) L_ERROR("This test requires libjpeg to run.\n", "pageseg_reg"); exit(77); #endif #if !defined(HAVE_LIBTIFF) L_ERROR("This test requires libtiff to run.\n", "pageseg_reg"); exit(77); #endif if (regTestSetup(argc, argv, &rp)) return 1; #if 1 /* Test the generic page segmentation */ pixs = pixRead("pageseg1.tif"); pixadb = pixaCreate(0); pixGetRegionsBinary(pixs, &pixhm, &pixtm, &pixtb, pixadb); pixDestroy(&pixhm); pixDestroy(&pixtm); pixDestroy(&pixtb); n = pixaGetCount(pixadb); for (i = 0; i < n; i++) { pix1 = pixaGetPix(pixadb, i, L_CLONE); regTestWritePixAndCheck(rp, pix1, IFF_PNG); /* 0 - 19 */ pixDestroy(&pix1); } /* Display intermediate images and final segmentation */ if (rp->display) { pix1 = pixaDisplayTiledAndScaled(pixadb, 32, 400, 4, 0, 20, 3); pixDisplay(pix1, 0, 0); pixDestroy(&pix1); pix1 = pixaGetPix(pixadb, 18, L_CLONE); pixDisplay(pix1, 510, 0); pixDestroy(&pix1); pix1 = pixaGetPix(pixadb, 19, L_CLONE); pixDisplay(pix1, 1140, 0); pixDestroy(&pix1); } pixaDestroy(&pixadb); /* Test foreground finding */ sa = getSortedPathnamesInDirectory(".", "lion-page", 0, 0); n = sarrayGetCount(sa); boxa = boxaCreate(n); box = boxCreate(0, 0, 0, 0); /* invalid box */ boxaInitFull(boxa, box); /* Init to invalid boxes */ boxDestroy(&box); pixac = pixacompCreate(n); for (i = 0; i < n; i++) { fname = sarrayGetString(sa, i, L_NOCOPY); pix1 = pixRead(fname); box = pixFindPageForeground(pix1, 170, 70, 30, 0, pixac); if (!box) { pixDestroy(&pix1); continue; } boxaReplaceBox(boxa, i, box); pixDestroy(&pix1); } boxaWriteMem(&data, &size, boxa); regTestWriteDataAndCheck(rp, data, size, "ba"); /* 20 */ boxaDestroy(&boxa); lept_free(data); l_pdfSetDateAndVersion(0); pixacompConvertToPdfData(pixac, 0, 1.0, L_DEFAULT_ENCODE, 0, "Page foreground", &data, &size); regTestWriteDataAndCheck(rp, data, size, "pdf"); /* 21 */ lept_free(data); sarrayDestroy(&sa); pixacompDestroy(&pixac); /* Test the greedy rectangle finder for white space */ pix1 = pixScale(pixs, 0.5, 0.5); pixFindLargeRectangles(pix1, 0, 20, &boxa, &pixdb); regTestWritePixAndCheck(rp, pixdb, IFF_PNG); /* 22 */ pixDisplayWithTitle(pixdb, 0, 700, NULL, rp->display); pixDestroy(&pixs); pixDestroy(&pix1); pixDestroy(&pixdb); boxaDestroy(&boxa); /* Test the table finder */ pix1 = pixRead("table.15.tif"); pixadb = pixaCreate(0); pixDecideIfTable(pix1, NULL, L_PORTRAIT_MODE, &score, pixadb); istable = (score >= 2) ? 1 : 0; regTestCompareValues(rp, 1.0, istable, 0.0); /* 23 */ pix2 = pixaDisplayTiledInRows(pixadb, 32, 2000, 1.0, 0, 30, 2); regTestWritePixAndCheck(rp, pix2, IFF_PNG); /* 24 */ pixDisplayWithTitle(pix2, 620, 700, NULL, rp->display); pixDestroy(&pix1); pixDestroy(&pix2); pixaDestroy(&pixadb); pix1 = pixRead("table.27.tif"); pixadb = pixaCreate(0); pixDecideIfTable(pix1, NULL, L_PORTRAIT_MODE, &score, pixadb); istable = (score >= 2) ? 1 : 0; regTestCompareValues(rp, 1.0, istable, 0.0); /* 25 */ pix2 = pixaDisplayTiledInRows(pixadb, 32, 2000, 1.0, 0, 30, 2); regTestWritePixAndCheck(rp, pix2, IFF_PNG); /* 26 */ pixDisplayWithTitle(pix2, 1000, 700, NULL, rp->display); pixDestroy(&pix1); pixDestroy(&pix2); pixaDestroy(&pixadb); pix1 = pixRead("table.150.png"); pixadb = pixaCreate(0); pixDecideIfTable(pix1, NULL, L_PORTRAIT_MODE, &score, pixadb); istable = (score >= 2) ? 1 : 0; regTestCompareValues(rp, 1.0, istable, 0.0); /* 27 */ pix2 = pixaDisplayTiledInRows(pixadb, 32, 2000, 1.0, 0, 30, 2); regTestWritePixAndCheck(rp, pix2, IFF_PNG); /* 28 */ pixDisplayWithTitle(pix2, 1300, 700, NULL, rp->display); pixDestroy(&pix1); pixDestroy(&pix2); pixaDestroy(&pixadb); pix1 = pixRead("toc.99.tif"); /* not a table */ pixadb = pixaCreate(0); pixDecideIfTable(pix1, NULL, L_PORTRAIT_MODE, &score, pixadb); istable = (score >= 2) ? 1 : 0; regTestCompareValues(rp, 0.0, istable, 0.0); /* 29 */ pix2 = pixaDisplayTiledInRows(pixadb, 32, 2000, 1.0, 0, 30, 2); regTestWritePixAndCheck(rp, pix2, IFF_PNG); /* 30 */ pixDisplayWithTitle(pix2, 1600, 700, NULL, rp->display); pixDestroy(&pix1); pixDestroy(&pix2); pixaDestroy(&pixadb); #endif /* Tests of auto-inversion of text */ pix1 = pixRead("zanotti-78.jpg"); pix2 = pixConvertRGBToLuminance(pix1); pixadb = pixaCreate(0); pixaAddPix(pixadb, pix2, L_COPY); pixGetDimensions(pix2, &w, &h, NULL); pixRasterop(pix2, 0.2 * w, 0.08 * h, 0.4 * w, 0.23 * h, PIX_NOT(PIX_DST), NULL, 0, 0); pixRasterop(pix2, 0.6 * w, 0.5 * h, 0.2 * w, 0.15 * h, PIX_NOT(PIX_DST), NULL, 0, 0); pix3 = pixAutoPhotoinvert(pix2, 128, &pix4, pixadb); pix5 = pixaDisplayTiledInColumns(pixadb, 5, 0.3, 20, 2); regTestWritePixAndCheck(rp, pix2, IFF_PNG); /* 31 */ regTestWritePixAndCheck(rp, pix4, IFF_PNG); /* 32 */ regTestWritePixAndCheck(rp, pix5, IFF_PNG); /* 33 */ pixDisplayWithTitle(pix5, 1750, 200, NULL, rp->display); pixaDestroy(&pixadb); pixDestroy(&pix1); pixDestroy(&pix2); pixDestroy(&pix3); pixDestroy(&pix4); pixDestroy(&pix5); pix1 = pixRead("invertedtext.tif"); pixadb = pixaCreate(0); pixaAddPix(pixadb, pix1, L_COPY); pix2 = pixAutoPhotoinvert(pix1, 128, &pix3, pixadb); pix4 = pixaDisplayTiledInColumns(pixadb, 5, 1.0, 20, 2); regTestWritePixAndCheck(rp, pix1, IFF_PNG); /* 34 */ regTestWritePixAndCheck(rp, pix3, IFF_PNG); /* 35 */ regTestWritePixAndCheck(rp, pix4, IFF_PNG); /* 36 */ pixDisplayWithTitle(pix4, 1750, 0, NULL, rp->display); pixDestroy(&pix1); pixDestroy(&pix2); pixDestroy(&pix3); pixDestroy(&pix4); return regTestCleanup(rp); }