source: trunk/c++_tools/utility/WeNNI.cc @ 675

Last change on this file since 675 was 675, checked in by Jari Häkkinen, 17 years ago

References #83. Changing project name to yat. Compilation will fail in this revision.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 2.7 KB
Line 
1// $Id: WeNNI.cc 675 2006-10-10 12:08:45Z jari $
2
3/*
4  Copyright (C) 2004 Jari Häkkinen
5  Copyright (C) 2005 Jari Häkkinen, Peter Johansson
6  Copyright (C) 2006 Jari Häkkinen
7
8  This file is part of the yat library, http://lev.thep.lu.se/trac/yat
9
10  The yat library is free software; you can redistribute it and/or
11  modify it under the terms of the GNU General Public License as
12  published by the Free Software Foundation; either version 2 of the
13  License, or (at your option) any later version.
14
15  The yat library is distributed in the hope that it will be useful,
16  but WITHOUT ANY WARRANTY; without even the implied warranty of
17  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18  General Public License for more details.
19
20  You should have received a copy of the GNU General Public License
21  along with this program; if not, write to the Free Software
22  Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
23  02111-1307, USA.
24*/
25
26#include "yat/utility/WeNNI.h"
27
28#include "yat/utility/matrix.h"
29#include "yat/utility/stl_utility.h"
30
31#include <algorithm>
32#include <cmath>
33#include <fstream>
34
35namespace theplu {
36namespace utility {
37
38
39  WeNNI::WeNNI(const utility::matrix& matrix,const utility::matrix& flag,
40               const u_int neighbours)
41    : NNI(matrix,flag,neighbours), imputed_data_raw_(matrix)
42  {
43    //estimate();
44  }
45
46
47
48  // \hat{x_{ij}}=\frac{ \sum_{k=1,N} \frac{w_{kj}*x_{kj}}{d_{ki}} }
49  //                   { \sum_{k=1,N} \frac{w_{kj}       }{d_{ki}} }
50  // where N is defined in the paper cited in the NNI class definition
51  // documentation.
52  u_int WeNNI::estimate(void)
53  {
54    for (unsigned int i=0; i<data_.rows(); i++) {
55      // Jari, avoid copying in next line
56      std::vector<std::pair<u_int,double> > distance=calculate_distances(i);
57      std::sort(distance.begin(),distance.end(),
58                pair_value_compare<u_int,double>());
59      bool row_imputed=true;
60      for (unsigned int j=0; j<data_.columns(); j++) {
61        std::vector<u_int> knn=nearest_neighbours(j,distance);
62        double new_value=0.0;
63        double norm=0.0;
64        for (std::vector<u_int>::const_iterator k=knn.begin(); k!=knn.end();
65             ++k) {
66          // Jari, a small number needed here, use something standardized.
67          // Avoid division with zero (perfect match vectors)
68          double d=(distance[*k].second ? distance[*k].second : 1e-10);
69          new_value+=(weight_(distance[*k].first,j) *
70                      data_(distance[*k].first,j)/d);
71          norm+=weight_(distance[*k].first,j)/d;
72        }
73        // No impute if no contributions from neighbours.
74        if (norm){
75          imputed_data_raw_(i,j) = new_value/norm;
76          imputed_data_(i,j)=
77            weight_(i,j)*data_(i,j) + (1-weight_(i,j))* imputed_data_raw_(i,j);
78        }
79        else
80          row_imputed=false;
81      }
82      if (!row_imputed)
83        not_imputed_.push_back(i);
84    }
85    return not_imputed_.size();
86  }
87
88
89}} // of namespace utility and namespace theplu
Note: See TracBrowser for help on using the repository browser.