// NOTE(review): this file appears to have been collapsed onto a single physical
// line. Because that line opens with "//", a C++ compiler treats everything on
// it as one comment -- including the #include, the using-directive, the
// namespace, the verbose_kmeans parameter and both function definitions -- so
// nothing below is compiled as written.
// NOTE(review): the text also looks damaged beyond the lost line breaks:
//   * the first loop in entropy() breaks off at "for(int i=0;i" and runs
//     straight into what looks like the parameter list of the k-means routine
//     (result, vectors, k, maxrounds=2, maxtrials=2); the rest of entropy()
//     and the name/return type of the second function are not present;
//   * the "narray" declarations carry no visible element type -- presumably
//     template arguments were stripped; confirm against the original;
//   * the trial loop header and the condition ending in "result_score))" are
//     incomplete, and the line ends in the middle of a "for" statement with
//     the function and the namespace still open.
// Restore this file from version control rather than repairing it by hand.
// -*- C++ -*- // Copyright 2006-2007 Deutsches Forschungszentrum fuer Kuenstliche Intelligenz // or its licensors, as applicable. // // You may not use this file except under the terms of the accompanying license. // // Licensed under the Apache License, Version 2.0 (the "License"); you // may not use this file except in compliance with the License. You may // obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. // // Project: roughocr -- mock OCR system exercising the interfaces and useful for testing // File: kmeans.cc // Purpose: kmeans implementation // Responsible: tmb // Reviewer: // Primary Repository: // Web Sites: www.iupr.org, www.dfki.de #include "colib.h" using namespace colib; namespace ocropus { param_bool verbose_kmeans("verbose_kmeans",1,"output progress report during kmeans computations"); double entropy(intarray &a) { double n = 0; for(int i=0;i &result,narray &vectors,int k,int maxrounds=2,int maxtrials=2) { int nvectors = vectors.length(); double result_score = 0; double means_score; narray< narray > indexes; doublearray dists; intarray counts; narray means; for(int trial=0;trial result_score)) { result.resize(k); for(int i=0;i