1 | #ifndef _theplu_yat_normalizer_z_score_ |
---|
2 | #define _theplu_yat_normalizer_z_score_ |
---|
3 | |
---|
4 | // $Id: Zscore.h 3550 2017-01-03 05:41:02Z peter $ |
---|
5 | |
---|
6 | /* |
---|
7 | Copyright (C) 2008 Jari Häkkinen, Peter Johansson |
---|
8 | Copyright (C) 2009, 2010, 2016 Peter Johansson |
---|
9 | |
---|
10 | This file is part of the yat library, http://dev.thep.lu.se/yat |
---|
11 | |
---|
12 | The yat library is free software; you can redistribute it and/or |
---|
13 | modify it under the terms of the GNU General Public License as |
---|
14 | published by the Free Software Foundation; either version 3 of the |
---|
15 | License, or (at your option) any later version. |
---|
16 | |
---|
17 | The yat library is distributed in the hope that it will be useful, |
---|
18 | but WITHOUT ANY WARRANTY; without even the implied warranty of |
---|
19 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
---|
20 | General Public License for more details. |
---|
21 | |
---|
22 | You should have received a copy of the GNU General Public License |
---|
23 | along with yat. If not, see <http://www.gnu.org/licenses/>. |
---|
24 | */ |
---|
25 | |
---|
26 | #include "utility.h" |
---|
27 | |
---|
28 | #include "yat/statistics/Averager.h" |
---|
29 | #include "yat/statistics/AveragerWeighted.h" |
---|
30 | |
---|
31 | #include "yat/utility/concept_check.h" |
---|
32 | #include "yat/utility/iterator_traits.h" |
---|
33 | |
---|
34 | #include <boost/concept_check.hpp> |
---|
35 | |
---|
36 | namespace theplu { |
---|
37 | namespace yat { |
---|
38 | namespace normalizer { |
---|
39 | |
---|
40 | /** |
---|
41 | \brief Zero mean and unity variance |
---|
42 | |
---|
43 | Shift and scale the values in a range as: \f$ y_i = |
---|
44 | \frac{x_i-m}{s} \f$ where \a m is the mean and \a s is the |
---|
45 | standard deviation. After normalization, the range will have zero |
---|
46 | mean and unity variance. |
---|
47 | |
---|
48 | Type Requirements: |
---|
49 | - \c InputIterator is \ref concept_data_iterator |
---|
50 | - \c InputIterator is \forward_traversal_iterator |
---|
51 | - \c OutputIterator is \writable_iterator |
---|
52 | - \c OutputIterator is \forward_traversal_iterator |
---|
53 | |
---|
54 | \since New in yat 0.5 |
---|
55 | */ |
---|
56 | class Zscore |
---|
57 | { |
---|
58 | public: |
---|
59 | /** |
---|
60 | The element in range [result, result + (last-first)) is |
---|
61 | calculated as result[i] = (first[i] - m) / s where m and std |
---|
62 | are the mean and standard deviation, respectively, of the range |
---|
63 | [first, last). |
---|
64 | |
---|
65 | It is possible to centralize a range "in place"; it is |
---|
66 | permissible for the iterators \a first and \a result to be the |
---|
67 | same. \see std::transform |
---|
68 | */ |
---|
69 | template<class InputIterator, class OutputIterator> |
---|
70 | void operator()(InputIterator first, InputIterator last, |
---|
71 | OutputIterator result) const |
---|
72 | { |
---|
73 | BOOST_CONCEPT_ASSERT((utility::DataIteratorConcept<InputIterator>)); |
---|
74 | BOOST_CONCEPT_ASSERT((utility::DataIteratorConcept<OutputIterator>)); |
---|
75 | |
---|
76 | // needed for weighted_if_any2 |
---|
77 | typename utility::weighted_if_any2<InputIterator, OutputIterator>::type tag; |
---|
78 | normalize(first, last, result, tag); |
---|
79 | } |
---|
80 | |
---|
81 | private: |
---|
82 | template<class ForwardIterator, class OutputIterator> |
---|
83 | void normalize(ForwardIterator first, ForwardIterator last, |
---|
84 | OutputIterator result, |
---|
85 | utility::unweighted_iterator_tag tag) const |
---|
86 | { |
---|
87 | // we need to traverse the input range once in calculating m |
---|
88 | // (and std) and a second time when assigning new values, so |
---|
89 | // single pass iterator will not suffice. |
---|
90 | BOOST_CONCEPT_ASSERT((boost_concepts::ForwardTraversal<ForwardIterator>)); |
---|
91 | |
---|
92 | BOOST_CONCEPT_ASSERT((boost_concepts::WritableIterator<OutputIterator>)); |
---|
93 | |
---|
94 | statistics::Averager a; |
---|
95 | add(a, first, last); |
---|
96 | double m = a.mean(); |
---|
97 | double std = a.std(); |
---|
98 | while (first!=last) { |
---|
99 | *result = (*first - m) / std; |
---|
100 | ++first; |
---|
101 | ++result; |
---|
102 | } |
---|
103 | } |
---|
104 | |
---|
105 | template<class ForwardIterator, class OutputIterator> |
---|
106 | void normalize(ForwardIterator first, ForwardIterator last, |
---|
107 | OutputIterator result, |
---|
108 | utility::weighted_iterator_tag tag) const |
---|
109 | { |
---|
110 | // we need to traverse the input range once in calculating m |
---|
111 | // (and std) and a second time when assigning new values, so |
---|
112 | // single pass iterator will not suffice. |
---|
113 | BOOST_CONCEPT_ASSERT((boost_concepts::ForwardTraversal<ForwardIterator>)); |
---|
114 | |
---|
115 | BOOST_CONCEPT_ASSERT((boost_concepts::WritableIterator<OutputIterator>)); |
---|
116 | // we traverse output range twice |
---|
117 | BOOST_CONCEPT_ASSERT((boost_concepts::ForwardTraversal<OutputIterator>)); |
---|
118 | detail::copy_weight_if_weighted(first, last, result); |
---|
119 | statistics::AveragerWeighted a; |
---|
120 | add(a, first, last); |
---|
121 | double m = a.mean(); |
---|
122 | double std = a.std(); |
---|
123 | utility::iterator_traits<ForwardIterator> in_trait; |
---|
124 | utility::iterator_traits<OutputIterator> out_trait; |
---|
125 | while (first!=last) { |
---|
126 | out_trait.data(result) = (in_trait.data(first) - m) / std; |
---|
127 | ++first; |
---|
128 | ++result; |
---|
129 | } |
---|
130 | } |
---|
131 | }; |
---|
132 | |
---|
133 | }}} // end of namespace normalizer, yat and thep |
---|
134 | #endif |
---|