// -*- C++ -*- // Copyright 2006-2007 Deutsches Forschungszentrum fuer Kuenstliche Intelligenz // or its licensors, as applicable. // // You may not use this file except under the terms of the accompanying license. // // Licensed under the Apache License, Version 2.0 (the "License"); you // may not use this file except in compliance with the License. You may // obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. // // Project: roughocr -- mock OCR system exercising the interfaces and useful for testing // File: ocr-layout-1cp.cc // Purpose: perform page layout analysis by thresholding the 1D projection // Responsible: tmb // Reviewer: // Primary Repository: // Web Sites: www.iupr.org, www.dfki.de #include "colib.h" #include "imgio.h" #include "imglib.h" #include "ocr-utils.h" #include "ocr-segmentations.h" using namespace ocropus; using namespace iulib; using namespace colib; struct SegmentPageBy1CP : ISegmentPage { ~SegmentPageBy1CP() {} const char *description() { return "segment characters by horizontal projection (assumes single column)\n"; } void init(const char **argv) { // nothing to be done } void segment(intarray &image,bytearray &in) { param_int thigh("thigh",20,"projection threshold"); param_int tlow("tlow",1,"projection threshold"); optional_check_background_is_lighter(in); bytearray binarized; binarize_simple(binarized, in); copy(image,in); for(int i=0;i