/**
 *  \file KMData.cpp
 *  \brief Holds data points to cluster using k-means
 *
 *  Copyright 2007-2010 IMP Inventors. All rights reserved.
 *
 */
// NOTE(review): this copy of the file arrived collapsed onto one line and with
// several spans of text missing (the #include operands, a template argument,
// and parts of three function bodies/headers). The code tokens below are
// reproduced exactly as received; only line breaks and comments were added.
// Each damaged span is flagged where it occurs. Restore the missing text from
// version control before building -- nothing here attempts to guess it.

// NOTE(review): the four header names that followed these directives are
// missing from this copy.
#include
#include
#include
#include
IMPSTATISTICS_BEGIN_NAMESPACE

/** Store the dimension \c d in dim_ and set points_ to the value returned by
    allocate_points(n, dim_).

    \param d value stored in dim_
    \param n first argument forwarded to allocate_points; presumably the
             number of points to allocate -- allocate_points is not defined in
             this view, confirm against its declaration.
 */
KMData::KMData(int d, int n) : dim_(d) {
  points_ = allocate_points(n,dim_);
}

/** Pass points_ to deallocate_points. */
KMData::~KMData() {
  deallocate_points(points_);
}

/** Return one data point chosen through internal::random_int.

    \param offset when equal to 0. the chosen point is returned as is (by
                  value). The handling of a non-zero offset is cut off in this
                  copy of the file; see the note inside the body.
    \return a KMPoint by value.
 */
KMPoint KMData::sample_center(double offset){
  // Index into *points_ with the value produced by
  // internal::random_int(points_->size()); presumably an index below the
  // container size -- confirm against random_int's contract.
  KMPoint *sampled_p = (*points_)[internal::random_int(points_->size())];
  if (offset == 0.) {
    // No perturbation requested: hand back a copy of the stored point.
    return *sampled_p;
  }
  KMPoint p;
  // NOTE(review): text is missing inside the next statement. What is left
  // fuses the start of a loop over "i" in sample_center with the end of a
  // checked condition whose message is "not enough points to sample from".
  // The end of sample_center and the header of the following function (which
  // uses the names sample, k, offset and allow_duplicate) are therefore not
  // visible here.
  for(int i=0;isize()<size(), "not enough points to sample from");
  // NOTE(review): the template argument of std::vector is missing. The
  // elements are compared with and pushed from the int "ri" below, so it is
  // presumably std::vector of int -- confirm.
  std::vector sampled_ind;
  // One pass per requested sample.
  for (int i = 0; i < k; i++) {
    int ri = internal::random_int(points_->size());
    if (!allow_duplicate) {
      // Redraw ri until it matches none of the indices chosen so far. Each
      // redraw restarts the scan from j = 0, so this loop only ends once an
      // index not yet in sampled_ind[0..i) has been drawn.
      bool dup_found;
      do {
        dup_found = false;
        // search for duplicates
        for (int j = 0; j < i; j++) {
          if (sampled_ind[j] == ri) {
            dup_found = true;
            ri = internal::random_int(points_->size());
            break;
          }
        }
      } while (dup_found);
    }
    sampled_ind.push_back(ri);
    // The new point is allocated with new and its pointer is stored in
    // *sample below; no matching delete appears in this view.
    KMPoint *p = new KMPoint();
    KMPoint *copied_p = (*points_)[ri];
    // NOTE(review): the loop condition, increment and the object that
    // push_back is called on are missing from the next statement. The
    // surviving part appends (*copied_p)[j] plus
    // internal::random_uniform(-1.,1)*offset.
    for(int j=0;jpush_back((*copied_p)[j]+internal::random_uniform(-1.,1)*offset);
    }
    sample->push_back(p);
  }
  // NOTE(review): text is missing inside the next statement. It fuses an
  // IMP_LOG call at VERBOSE level with the header of a later loop over "i".
  // The end of the sampling function and the header of the function that
  // owns the loop below (it uses the names from and to) are not visible.
  IMP_LOG(VERBOSE,"KMData::sampled centers : " <size()<size();i++) {
    // For each element of *from: allocate a fresh KMPoint, let copy_point
    // fill it from (*from)[i], and append its pointer to *to.
    KMPoint *p = new KMPoint();
    copy_point((*from)[i],p);
    to->push_back(p);
  }
}

/** Write the coordinates of \c p to \c out between "[ " and " ]".

    \param p   point to print; every element p[i] is written with
               std::setw(8), followed by the separator literal.
    \param out stream that receives the text; it is not flushed here.
 */
void print_point(const KMPoint &p,std::ostream &out) {
  out << "[ ";
  for (unsigned int i = 0; i < p.size(); i++) {
    out << std::setw(8) << p[i] <<" ";
  }
  out << " ]";
}

/** Write a titled listing of the points in \c ps to \c out.

    The listing starts with " (" followed by \c title and ":\n". Each point
    is then written on its own line as its index, a tab and the output of
    print_point. The listing ends with " )" and std::endl, which also flushes
    the stream.

    \param title text written in the first line of the listing
    \param ps    array whose elements are dereferenced and printed in order
    \param out   stream that receives the text
 */
void print_points(const std::string &title,const KMPointArray &ps,
                  std::ostream &out) {
  out << " (" << title << ":\n";
  for (unsigned int i = 0; i < ps.size(); i++) {
    out << " " << i << "\t";
    print_point(*(ps[i]), out);
    out << "\n";
  }
  out << " )" << std::endl;
}
IMPSTATISTICS_END_NAMESPACE