annotate lib/StatisticsUtil.pm @ 1:2abf0d43254d draft

Uploaded
author deepakjadmin
date Wed, 20 Jan 2016 09:10:43 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1 package StatisticsUtil;
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
2 #
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
3 # $RCSfile: StatisticsUtil.pm,v $
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
4 # $Date: 2015/02/28 20:47:18 $
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
5 # $Revision: 1.41 $
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
6 #
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
7 # Author: Manish Sud <msud@san.rr.com>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
8 #
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
9 # Copyright (C) 2015 Manish Sud. All rights reserved.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
10 #
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
11 # This file is part of MayaChemTools.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
12 #
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
13 # MayaChemTools is free software; you can redistribute it and/or modify it under
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
14 # the terms of the GNU Lesser General Public License as published by the Free
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
15 # Software Foundation; either version 3 of the License, or (at your option) any
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
16 # later version.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
17 #
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
18 # MayaChemTools is distributed in the hope that it will be useful, but without
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
19 # any warranty; without even the implied warranty of merchantability or fitness
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
20 # for a particular purpose. See the GNU Lesser General Public License for more
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
21 # details.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
22 #
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
23 # You should have received a copy of the GNU Lesser General Public License
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
24 # along with MayaChemTools; if not, see <http://www.gnu.org/licenses/> or
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
25 # write to the Free Software Foundation Inc., 59 Temple Place, Suite 330,
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
26 # Boston, MA, 02111-1307, USA.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
27 #
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
28
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
29 use strict;
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
30 use Exporter;
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
31
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
32 use vars qw(@ISA @EXPORT @EXPORT_OK %EXPORT_TAGS);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
33
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
34 @ISA = qw(Exporter);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
35 @EXPORT = qw(Average AverageDeviation Covariance Correlation Euclidean Factorial FactorialDivison GeometricMean Frequency HarmonicMean KLargest KSmallest Kurtosis Maximum Minimum Mean Median Mode PearsonCorrelation Permutations Product Range RSquare Skewness Sum SumOfSquares StandardDeviation StandardDeviationN StandardError Standardize StandardScores StandardScoresN TrimMean Variance VarianceN);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
36 @EXPORT_OK = qw();
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
37 %EXPORT_TAGS = (all => [@EXPORT, @EXPORT_OK]);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
38
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the arithmetic mean of an array of numbers.
#
# Takes a reference to an array of numbers and hands it straight to Mean();
# Average is simply an alternate name for that function, so whatever Mean()
# returns is returned unchanged.
sub Average {
  my $XArrayRef = shift;

  return Mean($XArrayRef);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
44
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the average of the absolute deviations of an array of numbers:
#
#   SUM( ABS(x[i] - Xmean) ) / n
#
# Takes a reference to an array of numbers. Returns undef for an empty array;
# otherwise the mean obtained from Mean() is subtracted from every value and
# the absolute differences are averaged over the number of values.
sub AverageDeviation {
  my $XArrayRef = shift;

  return undef unless @$XArrayRef;

  my $Mean = Mean($XArrayRef);

  # Accumulate the absolute distance of each value from the mean...
  my $SumOfDeviations;
  $SumOfDeviations += abs($_ - $Mean) for @$XArrayRef;

  return $SumOfDeviations / @$XArrayRef;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
63
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the correlation coefficient between two arrays of numbers.
#
# Takes references to the X and Y arrays and forwards them, in that order, to
# PearsonCorrelation(); its result is returned unchanged.
sub Correlation {
  my $XArrayRef = shift;
  my $YArrayRef = shift;

  return PearsonCorrelation($XArrayRef, $YArrayRef);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
69
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the covariance between two arrays of numbers:
#
#   SUM( (x[i] - Xmean) (y[i] - Ymean) ) / n
#
# Takes references to the X and Y arrays. Returns undef unless both arrays are
# non-empty and contain the same number of values; otherwise returns the sum of
# the products of the paired deviations from the respective means (as computed
# by Mean()) divided by the number of values.
sub Covariance {
  my($XArrayRef, $YArrayRef) = @_;

  # Both arrays must hold data and must be of equal size...
  if (!(@$XArrayRef && @$YArrayRef && (@$XArrayRef == @$YArrayRef))) {
    return undef;
  }

  my $XMean = Mean($XArrayRef);
  my $YMean = Mean($YArrayRef);

  # Note: the last index is taken from the reference itself. The earlier
  # "$#{@$XArrayRef}" form uses an array as a reference, which newer versions
  # of Perl reject at compile time.
  my $ProductOfDeviations = 0;
  for my $Index (0 .. $#{$XArrayRef}) {
    $ProductOfDeviations += (($XArrayRef->[$Index] - $XMean) * ($YArrayRef->[$Index] - $YMean));
  }

  return $ProductOfDeviations / @$XArrayRef;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
89
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the Euclidean length of an array of numbers treated as a vector:
#
#   SQRT( SUM( x[i] ** 2 ) )
#
# Takes a reference to an array of numbers. Returns undef for an empty array;
# otherwise returns the square root of the value supplied by SumOfSquares().
sub Euclidean {
  my $XArrayRef = shift;

  return undef if !@$XArrayRef;

  my $SquaredLength = SumOfSquares($XArrayRef);

  return sqrt($SquaredLength);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
103
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the factorial of a number.
#
# Delegates to _Factorial() with a lower limit of 1, so the result is the
# product Num * (Num - 1) * ... * 2. _Factorial() returns undef when Num is
# not a positive integer.
sub Factorial {
  my $Num = shift;

  return _Factorial($Num, 1);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
110
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Perform factorial division of two numbers: Numerator! / Denominator!
#
# Both arguments must be positive integers; undef is returned otherwise. The
# common factors are never multiplied out: only the integers lying between the
# two arguments are multiplied together by _Factorial(), and the reciprocal is
# taken when the numerator is the smaller of the two.
sub FactorialDivison {
  my($Numerator, $Denominator) = @_;

  # Only works for integer numbers...
  for my $Operand ($Numerator, $Denominator) {
    return undef if $Operand <= 0 || ($Operand != int($Operand));
  }

  my $Result;
  if ($Numerator < $Denominator) {
    # Numerator!/Denominator! = 1 / (Denominator * ... * (Numerator + 1))
    $Result = _Factorial($Denominator, $Numerator);
    $Result = 1/$Result;
  }
  else {
    # Numerator!/Denominator! = Numerator * ... * (Denominator + 1)
    $Result = _Factorial($Numerator, $Denominator);
  }
  return $Result;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
130
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Calculate the factorial of a number down to, but not including, a specific limit:
#
#   Num * (Num - 1) * ... * (Limit + 1)
#
# Returns undef unless Num is a positive integer and Limit is at least 1. The
# result is 1 when Num does not exceed Limit.
sub _Factorial {
  my($Num, $Limit) = @_;

  # Only works for integer numbers...
  return undef if $Num <= 0 || ($Num != int($Num)) || $Limit < 1;

  # Multiply from the largest factor downwards until the limit is reached...
  my $Result = 1;
  for (my $Factor = $Num; $Factor > $Limit; $Factor--) {
    $Result *= $Factor;
  }
  return $Result;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
148
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Generate all possible permutations of the items passed in as a list and
# return a reference to an array containing array references to the generated
# permutations. Returns undef when no items are supplied.
#
# Every permutation number from 0 to Factorial(number of items) - 1 is turned
# into a list of indices, which is then used to pick the items in permuted order.
#
# This algorithm is based on the example provided by Mark Jason-Dominus, and is available
# at CPAN as mjd_permute standalone script.
#
sub Permutations {
  my @DataToPermute = @_;

  return undef unless @DataToPermute;

  my $LastIndex = $#DataToPermute;
  my $NumOfPermutations = Factorial(scalar @DataToPermute);

  my @Permutations;
  my $PermutationNum = 0;
  while ($PermutationNum < $NumOfPermutations) {
    # Map the permutation number to indices and slice out the items...
    my @Indices = _PermutationNumToPermutation($PermutationNum, $LastIndex);
    push @Permutations, [ @DataToPermute[@Indices] ];
    $PermutationNum++;
  }

  return \@Permutations;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
173
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Generate the Nth permutation for a collection of a specific size...
#
# Num is the permutation number and Size is passed through unchanged to
# _PermutationNumToPattern(); the resulting pattern is converted into a list
# of indices by _PatternToPermutation().
#
sub _PermutationNumToPermutation {
  my($Num, $Size) = @_;

  my @Pattern = _PermutationNumToPattern($Num, $Size);

  return _PatternToPermutation(@Pattern);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
181
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Generate the Nth pattern for a collection of a specific size...
#
# The pattern holds Size + 1 entries: for each divisor 1, 2, ..., Size + 1 in
# turn, the remainder of the number is recorded and the number is replaced by
# its integer quotient.
#
sub _PermutationNumToPattern {
  my($Num, $Size) = @_;

  my @Pattern;
  for (my $Index = 1; $Index <= $Size + 1; $Index++) {
    push @Pattern, $Num % $Index;
    $Num = int($Num/$Index);
  }

  return @Pattern;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
198
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Generate a permutation of integers from a pattern...
#
# Starting from the ordered indices 0 .. (pattern size - 1), the pattern is
# consumed from its last entry to its first; each entry is the position of the
# index to remove from the remaining indices and append to the permutation.
#
sub _PatternToPermutation {
  my @Pattern = @_;

  my @Source = (0 .. $#Pattern);

  my @Permutation;
  for my $Position (reverse @Pattern) {
    push @Permutation, splice(@Source, $Position, 1);
  }

  return @Permutation;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
213
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the frequency of occurrence of values in an array of numbers. Three different
# invocation methods are supported:
#
# Frequency(\@ArrayRef) : Using the smallest and largest values, group the numbers into
# 10 bins.
#
# Frequency(\@ArrayRef, $NumOfBins) : Using the smallest and largest values, group the
# numbers into the specified number of bins.
#
# Frequency(\@ArrayRef, \@BinRange): Use the bin range to group the values into different bins.
#
# A hash array is returned with keys and values representing range and frequency values respectively.
# The frequency value for a specific key corresponds to all the values which are greater than
# the previous key and less than or equal to the current key. A key value representing maximum value is
# added for generating frequency distribution for specific number of bins, and whenever the maximum
# array value is greater than the maximum specified in bin range, it is also added to bin range.
#
# undef is returned for an empty array, for a bin range with fewer than two values or with
# values which are not in strictly increasing order, and for a number of bins which is not
# greater than 1.
#
sub Frequency {
  my($XArrayRef) = @_;

  if (!@$XArrayRef) {
    return undef;
  }

  my $NumOfBins = 10;
  my $BinRange;

  if (@_ == 2) {
    if (ref($_[1]) eq 'ARRAY') {
      $BinRange = $_[1];
      if (@$BinRange < 2) {
        return undef;
      }
      # Make sure the bin range contains values in increasing order: each value must
      # be larger than the one just before it...
      for my $Index (1 .. $#{$BinRange}) {
        if ($BinRange->[$Index - 1] >= $BinRange->[$Index]) {
          return undef;
        }
      }
    }
    else {
      $NumOfBins = $_[1];
      if ($NumOfBins <= 1) {
        return undef;
      }
    }
  }

  # Setup range keys...
  my @RangeKeys;
  my($MinValue, $MaxValue) = Range($XArrayRef);

  if (defined $BinRange) {
    @RangeKeys = @$BinRange;
    # Add a closing bin for values beyond the last specified bin limit...
    if ($MaxValue > $RangeKeys[-1]) {
      push @RangeKeys, $MaxValue;
    }
  }
  else {
    my $Interval = ($MaxValue - $MinValue)/$NumOfBins;
    my $KeyValue = $MinValue + $Interval;
    while ($KeyValue < $MaxValue) {
      push @RangeKeys, $KeyValue;
      my $NextKeyValue = $KeyValue + $Interval;
      # Stop when the interval is too small to advance the key at this magnitude;
      # without this check the loop would never terminate...
      last if $NextKeyValue == $KeyValue;
      $KeyValue = $NextKeyValue;
    }
    push @RangeKeys, $MaxValue;
  }

  # Setup frequency hash array...
  my %FrequencyMap = map { ($_ => 0) } @RangeKeys;

  # Count values: each value goes into the first bin whose key is not smaller than it...
  VALUE: for my $Value (@$XArrayRef) {
    for my $Key (@RangeKeys) {
      if ($Value <= $Key) {
        $FrequencyMap{$Key} += 1;
        next VALUE;
      }
    }
  }
  return (%FrequencyMap);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
308
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the geometric mean of an array of numbers: NthROOT( PRODUCT(x[i]) )
#
# Takes a reference to an array of numbers. Returns undef for an empty array
# or when any value is not greater than zero.
#
# The mean is normally taken as the Nth root of the product of the values. When
# that product overflows to infinity or underflows to zero, the mean is computed
# instead as EXP( SUM( LOG(x[i]) ) / n ), which is mathematically the same value
# but stays within floating point range.
sub GeometricMean {
  my($XArrayRef) = @_;

  if (!@$XArrayRef) {
    return undef;
  }

  my $Count = @$XArrayRef;
  my $Product = 1;
  foreach my $Value (@$XArrayRef) {
    if ($Value <= 0) {
      return undef;
    }
    $Product *= $Value;
  }

  # A product of positive values can only be zero or infinite when it has left
  # the floating point range; switch to the sum of logarithms in that case...
  my $Infinity = 9**9**9;
  if ($Product == 0 || $Product == $Infinity) {
    my $SumOfLogs = 0;
    $SumOfLogs += log($_) for @$XArrayRef;
    return exp($SumOfLogs / $Count);
  }

  return $Product ** (1 / $Count);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
327
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the harmonic mean of an array of numbers: 1 / ( SUM(1/x[i]) / n )
#
# Takes a reference to an array of numbers. Returns undef for an empty array
# or when any value is not greater than zero.
sub HarmonicMean {
  my $XArrayRef = shift;

  my $Count = @$XArrayRef;
  return undef if !$Count;

  # Add up the reciprocals, giving up on the first non-positive value...
  my $SumOfReciprocals = 0;
  for my $Value (@$XArrayRef) {
    return undef if $Value <= 0;
    $SumOfReciprocals += 1/$Value;
  }

  return 1/($SumOfReciprocals/$Count);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
346
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Return the k-largest value from an array of numbers
#
# Takes a reference to an array of numbers and K, where K = 1 selects the
# largest value. Returns undef for an empty array or when K does not lie
# between 1 and the number of values.
sub KLargest {
  my($XArrayRef, $K) = @_;

  my $Count = @$XArrayRef;
  return undef unless $Count && ($K > 0) && ($K <= $Count);

  # Sort numerically from largest to smallest and pick the Kth entry...
  my @Descending = sort { $b <=> $a } @$XArrayRef;

  return $Descending[$K - 1];
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
359
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Return the k-smallest value from an array of numbers
#
# Takes a reference to an array of numbers and K, where K = 1 selects the
# smallest value. Returns undef for an empty array or when K does not lie
# between 1 and the number of values.
sub KSmallest {
  my($XArrayRef, $K) = @_;

  my $Count = @$XArrayRef;
  return undef unless $Count && ($K > 0) && ($K <= $Count);

  # Sort numerically from smallest to largest and pick the Kth entry...
  my @Ascending = sort { $a <=> $b } @$XArrayRef;

  return $Ascending[$K - 1];
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
372
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the kurtosis of an array of numbers:
#
#   [ {n(n + 1)/((n - 1)(n - 2)(n - 3))} SUM{ ((x[i] - Xmean)/STDDEV)^4 } ] - {3((n - 1)^2)}/{(n - 2)(n - 3)}
#
# Xmean is obtained from Mean() and STDDEV from StandardDeviation(). Returns undef
# when the array holds fewer than four values or when the standard deviation is
# undefined or zero.
#
sub Kurtosis {
  my($XArrayRef) = @_;

  # The (n - 3) term in the denominator requires at least four values...
  my $SampleSize = @$XArrayRef;
  if ($SampleSize <= 3) {
    return undef;
  }

  my $Mean = Mean($XArrayRef);
  return undef unless defined $Mean;

  my $StandardDeviation = StandardDeviation($XArrayRef);
  if (!defined($StandardDeviation) || $StandardDeviation == 0) {
    return undef;
  }

  # Sum of the standardized deviations raised to the fourth power...
  my $SumOfScores = 0;
  for my $Value (@$XArrayRef) {
    $SumOfScores += (($Value - $Mean)/$StandardDeviation) ** 4;
  }

  my $ScaleFactor = ($SampleSize * ($SampleSize + 1))/(($SampleSize - 1) * ($SampleSize - 2) * ($SampleSize - 3));
  my $Correction = (3 * (($SampleSize - 1) ** 2))/(($SampleSize - 2) * ($SampleSize - 3));

  return ($ScaleFactor * $SumOfScores) - $Correction;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
401
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Return the smallest value from an array of numbers by asking KSmallest() for
# the first-ranked value; whatever KSmallest() returns is passed back unchanged.
#
sub Minimum {
  my $XArrayRef = shift;

  return KSmallest($XArrayRef, 1);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
407
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Return the largest value from an array of numbers by asking KLargest() for
# the first-ranked value; whatever KLargest() returns is passed back unchanged.
#
sub Maximum {
  my $XArrayRef = shift;

  return KLargest($XArrayRef, 1);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
413
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the arithmetic mean of an array of numbers: SUM( x[i] ) / n
#
# Returns undef for an empty array.
#
sub Mean {
  my($XArrayRef) = @_;

  return undef unless @$XArrayRef;

  my $Total = 0;
  $Total += $_ for @$XArrayRef;

  return $Total / scalar(@$XArrayRef);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
429
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the median value of an array of numbers. For an even number array, it's
# the average of two middle values.
#
# Using 0-based indices into the ascending sorted array:
#
#   For odd values of n:  Xsorted[(n - 1)/2]
#   For even values of n: (Xsorted[n/2 - 1] + Xsorted[n/2])/2
#
# Returns undef for an empty array.
#
sub Median {
  my($XArrayRef) = @_;

  return undef unless @$XArrayRef;

  my @SortedValues = sort { $a <=> $b } @$XArrayRef;
  my $Count = @SortedValues;

  if ($Count % 2) {
    # Odd number array: (n - 1) is even, so the division is exact...
    return $SortedValues[($Count - 1)/2];
  }

  # Even number array: average the two values around the midpoint...
  my $UpperMidIndex = int($Count / 2);
  return ($SortedValues[$UpperMidIndex - 1] + $SortedValues[$UpperMidIndex]) / 2;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
458
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Return the most frequently occurring value in an array of numbers.
#
# A value qualifies as a mode only when it occurs more than once; undef is
# returned for an empty array or when no value repeats.
#
# In list context, all the values sharing the highest frequency are returned,
# sorted numerically in descending order. In scalar context, the largest of those
# values is returned, so the result no longer depends on hash key ordering when
# the data has multiple modes.
#
sub Mode {
  my($XArrayRef) = @_;

  if (!@$XArrayRef) {
    return undef;
  }

  # Count the occurrences and track the highest frequency in a single pass...
  my($Value, $ModeCount, %ValueToCountMap);
  %ValueToCountMap = ();
  $ModeCount = 0;
  for $Value (@$XArrayRef) {
    $ValueToCountMap{$Value} += 1;
    if ($ValueToCountMap{$Value} > $ModeCount) {
      $ModeCount = $ValueToCountMap{$Value};
    }
  }

  # Make sure the frequency of mode value is greater than one...
  if ($ModeCount <= 1) {
    return undef;
  }

  # Collect all the values occurring with the highest frequency...
  my(@Modes);
  @Modes = sort { $b <=> $a } grep { $ValueToCountMap{$_} == $ModeCount } keys %ValueToCountMap;

  if (wantarray) {
    return @Modes;
  }
  else {
    return $Modes[0];
  }
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
524
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
525
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the Pearson correlation coefficient between two arrays of numbers:
#
#   SUM( (x[i] - Xmean)(y[i] - Ymean) ) / SQRT( SUM( (x[i] - Xmean)^2 )(SUM( (y[i] - Ymean)^2 )) )
#
# It returns values in the range from -1.0 to 1.0
#
# Returns undef when either array is empty, when the array sizes differ, or when
# the denominator is zero (all the values in at least one array are identical),
# as the coefficient is not defined in that case.
#
sub PearsonCorrelation {
  my($XArrayRef, $YArrayRef) = @_;

  if (!(@$XArrayRef && @$YArrayRef && (@$XArrayRef == @$YArrayRef))) {
    return undef;
  }
  my($XMean, $YMean, $Index, $XValueDeviation, $YValueDeviation, $SquareOfXDeviations, $SquareOfYDeviations, $ProductOfDeviations, $Denominator);

  $XMean = Mean($XArrayRef);
  $YMean = Mean($YArrayRef);
  $ProductOfDeviations = 0; $SquareOfXDeviations = 0; $SquareOfYDeviations = 0;

  # Take the last index straight from the array reference...
  for $Index (0 .. $#{$XArrayRef}) {
    $XValueDeviation = $XArrayRef->[$Index] - $XMean;
    $YValueDeviation = $YArrayRef->[$Index] - $YMean;
    $ProductOfDeviations += ($XValueDeviation * $YValueDeviation);
    $SquareOfXDeviations += $XValueDeviation ** 2;
    $SquareOfYDeviations += $YValueDeviation ** 2;
  }

  # Avoid a fatal division by zero for data without any variation...
  $Denominator = sqrt($SquareOfXDeviations * $SquareOfYDeviations);
  if ($Denominator == 0) {
    return undef;
  }
  return $ProductOfDeviations / $Denominator;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
553
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Return the smallest and largest values from an array of numbers as a two
# element list: (smallest, largest). For an empty array, (undef, undef) is returned.
#
sub Range {
  my($XArrayRef) = @_;

  return (undef, undef) unless @$XArrayRef;

  # The ends of the ascending sorted array hold the two extremes...
  my @AscendingValues = sort { $a <=> $b } @$XArrayRef;
  return ($AscendingValues[0], $AscendingValues[-1]);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
567
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute square of the Pearson correlation coefficient between two arrays of numbers.
#
# Returns undef whenever PearsonCorrelation() returns undef for the two arrays.
#
sub RSquare {
  my($XArrayRef, $YArrayRef) = @_;

  my $Correlation = PearsonCorrelation($XArrayRef, $YArrayRef);

  return defined($Correlation) ? $Correlation ** 2 : undef;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
581
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the skewness of an array of numbers:
#
#   {n/((n - 1)(n - 2))} SUM{ ((x[i] - Xmean)/STDDEV)^3 }
#
# Xmean is obtained from Mean() and STDDEV from StandardDeviation(). Returns undef
# when the array holds fewer than three values or when the standard deviation is
# undefined or zero.
#
sub Skewness {
  my($XArrayRef) = @_;

  # The (n - 2) term in the denominator requires at least three values...
  my $SampleSize = @$XArrayRef;
  if ($SampleSize <= 2) {
    return undef;
  }

  my $Mean = Mean($XArrayRef);
  return undef unless defined $Mean;

  my $StandardDeviation = StandardDeviation($XArrayRef);
  if (!defined($StandardDeviation) || $StandardDeviation == 0) {
    return undef;
  }

  # Sum of the standardized deviations raised to the third power...
  my $SumOfScores = 0;
  for my $Value (@$XArrayRef) {
    $SumOfScores += (($Value - $Mean)/$StandardDeviation) ** 3;
  }

  my $ScaleFactor = $SampleSize/(($SampleSize - 1) * ($SampleSize - 2) );
  return $ScaleFactor * $SumOfScores;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
610
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the standard deviation of an array of numbers using the (n - 1)
# denominator: delegates to _CalculateStandardDeviation() with mode 2.
#
sub StandardDeviation {
  my $XArrayRef = shift;

  return _CalculateStandardDeviation($XArrayRef, 2);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
616
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the standard deviation of an array of numbers representing entire
# population, using the n denominator: delegates to _CalculateStandardDeviation()
# with mode 1.
#
sub StandardDeviationN {
  my $XArrayRef = shift;

  return _CalculateStandardDeviation($XArrayRef, 1);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
622
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the standard deviation of an array of numbers.
#
#   Mode 1: SQRT ( SUM( (x[i] - mean)^2 ) / n )
#   Mode 2: SQRT ( SUM( (x[i] - mean)^2 ) / (n - 1) )
#
# Any mode value other than 1 is treated as mode 2.
#
# Returns undef for an empty array and also when the divisor is zero, which
# happens for a single value array in mode 2; the standard deviation is not
# defined in that case and the division would otherwise be fatal.
#
sub _CalculateStandardDeviation {
  my($XArrayRef, $Mode) = @_;

  if (!@$XArrayRef) {
    return undef;
  }
  my($Value, $SquareOfDeviations, $Mean, $N);

  # Validate the divisor before doing any other work...
  $N = ($Mode == 1) ? scalar(@$XArrayRef) : (scalar(@$XArrayRef) - 1);
  if ($N <= 0) {
    return undef;
  }

  $Mean = Mean($XArrayRef);
  $SquareOfDeviations = 0;
  foreach $Value (@$XArrayRef) {
    $SquareOfDeviations += ($Value - $Mean) ** 2;
  }

  return sqrt($SquareOfDeviations / $N);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
646
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the standard error using standard deviation and sample size:
#
#   StandardDeviation / SQRT( Count )
#
# Returns undef when the sample size is zero or negative.
#
sub StandardError {
  my($StandardDeviation, $Count) = @_;

  return ($Count <= 0) ? undef : $StandardDeviation / sqrt($Count);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
659
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Standardize the value using mean and standard deviation:
#
#   (Value - Mean) / StandardDeviation
#
# Returns undef when the standard deviation is zero or negative.
#
sub Standardize {
  my($Value, $Mean, $StandardDeviation) = @_;

  return ($StandardDeviation <= 0) ? undef : ($Value - $Mean)/$StandardDeviation;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
672
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the standard scores for an array of numbers, i.e. the number of
# standard deviations each value lies above the mean, with the standard deviation
# calculated using the (n - 1) denominator: delegates to _CalculateStandardScores()
# with mode 2.
#
sub StandardScores {
  my $XArrayRef = shift;

  return _CalculateStandardScores($XArrayRef, 2);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
678
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the standard scores for an array of numbers representing entire
# population, i.e. the number of standard deviations each value lies above the
# mean, with the standard deviation calculated using the n denominator: delegates
# to _CalculateStandardScores() with mode 1.
#
sub StandardScoresN {
  my $XArrayRef = shift;

  return _CalculateStandardScores($XArrayRef, 1);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
684
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the standard scores for an array of numbers:
#
#   (x[i] - mean) / STDDEV
#
# where STDDEV is calculated by _CalculateStandardDeviation() using the specified
# mode; the mode value is passed through to it unchanged.
#
# Returns the list of scores in the same order as the input values. Returns undef
# for an empty array or when the standard deviation is undefined or not greater
# than zero.
#
sub _CalculateStandardScores {
  my($XArrayRef, $Mode) = @_;

  return undef unless @$XArrayRef;

  my $Mean = Mean($XArrayRef);
  my $StandardDeviation = _CalculateStandardDeviation($XArrayRef, $Mode);
  unless (defined($StandardDeviation) && $StandardDeviation > 0) {
    return undef;
  }

  my @StandardScores = map { ($_ - $Mean)/$StandardDeviation } @$XArrayRef;

  return @StandardScores;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
709
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the product of an array of numbers.
#
# Returns undef for an empty array.
#
sub Product {
  my($XArrayRef) = @_;

  return undef unless @$XArrayRef;

  my $Result = 1;
  $Result *= $_ for @$XArrayRef;

  return $Result;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
724
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the sum of an array of numbers.
#
# Returns undef for an empty array.
#
sub Sum {
  my($XArrayRef) = @_;

  return undef unless @$XArrayRef;

  my $Total = 0;
  $Total += $_ for @$XArrayRef;

  return $Total;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
739
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the sum of squares of an array of numbers: SUM( x[i]^2 )
#
# Parameters:
#   $XArrayRef - reference to an array of numbers.
#
# Returns the sum of the squared values, or undef when the argument is not a
# reference or refers to an empty array.
#
sub SumOfSquares {
  my($XArrayRef) = @_;

  # A missing or non-reference argument cannot be dereferenced (it is a fatal
  # error under strict refs), so treat it the same way as an empty array.
  if (!ref($XArrayRef) || !@$XArrayRef) {
    return undef;
  }
  my($SumOfSquares, $Value);

  $SumOfSquares = 0;
  foreach $Value (@$XArrayRef) {
    $SumOfSquares += $Value ** 2;
  }
  return $SumOfSquares;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
754
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the mean of an array of numbers by excluding a fraction of
# numbers from the top and bottom of the data set.
#
# Parameters:
#   $XArrayRef         - reference to an array of numbers.
#   $FractionToExclude - total fraction of values to drop; it must be greater
#                        than 0 and less than or equal to 1.
#
# The number of values to drop is int(n * fraction) rounded down to an even
# number, so that the same count is removed from each end of the sorted data.
#
# Returns the mean of the remaining values, or undef when the array argument
# is not a reference or is empty, when the fraction is undefined or out of
# range, or when every value would be dropped.
#
sub TrimMean {
  my($XArrayRef, $FractionToExclude) = @_;

  # A missing or non-reference argument cannot be dereferenced (it is a fatal
  # error under strict refs), so treat it the same way as an empty array.
  if (!ref($XArrayRef) || !@$XArrayRef) {
    return undef;
  }
  # Check definedness first so an omitted fraction is rejected without
  # comparing an undefined value numerically.
  if (!(defined($FractionToExclude) && $FractionToExclude > 0 && $FractionToExclude <= 1)) {
    return undef;
  }
  my($NumberToExclude);

  $NumberToExclude = int(@$XArrayRef * $FractionToExclude);
  # Round an odd count down to the nearest even count.
  $NumberToExclude = ($NumberToExclude % 2) ? ($NumberToExclude - 1) : $NumberToExclude;
  if ($NumberToExclude == @$XArrayRef) {
    # Nothing would be left to average.
    return undef;
  }
  my($Mean, $Sum, $Index, $FirstIndex, $LastIndex);

  # Half of the excluded values come off each end of the sorted data.
  $FirstIndex = $NumberToExclude/2;
  $LastIndex = @$XArrayRef - ($NumberToExclude/2) - 1;

  my(@SortedXArray);
  @SortedXArray = sort { $a <=> $b } @$XArrayRef;

  $Sum = 0;
  for $Index ($FirstIndex .. $LastIndex) {
    $Sum += $SortedXArray[$Index];
  }
  $Mean = $Sum/(@SortedXArray - $NumberToExclude);
  return $Mean;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
781
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the variance of an array of numbers using the (n - 1) divisor:
# SUM( (x[i] - Xmean)^2 / (n - 1) )
#
# Parameters:
#   $XArrayRef - reference to an array of numbers.
#
# Returns whatever _CalculateVariance returns for mode 2.
#
sub Variance {
  my($XArrayRef) = @_;
  my($VarianceMode);

  # Mode 2 selects the (n - 1) divisor in _CalculateVariance.
  $VarianceMode = 2;
  return _CalculateVariance($XArrayRef, $VarianceMode);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
787
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the variance of an array of numbers representing entire population,
# using the n divisor: SUM( (x[i] - Xmean)^2 / n )
#
# Parameters:
#   $XArrayRef - reference to an array of numbers.
#
# Returns whatever _CalculateVariance returns for mode 1.
#
sub VarianceN {
  my($XArrayRef) = @_;
  my($VarianceMode);

  # Mode 1 selects the n divisor in _CalculateVariance.
  $VarianceMode = 1;
  return _CalculateVariance($XArrayRef, $VarianceMode);
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
793
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
# Compute the variance of an array of numbers:
# Mode 1: SUM( (x[i] - Xmean)^2 / n )
# Mode 2: SUM( (x[i] - Xmean)^2 / (n - 1) )
#
# Parameters:
#   $XArrayRef - reference to an array of numbers.
#   $Mode      - 1 divides by n; any other value divides by (n - 1).
#
# Returns the variance, or undef when the array argument is not a reference
# or is empty, or when the divisor would be zero (a single value with the
# (n - 1) divisor).
#
sub _CalculateVariance {
  my($XArrayRef, $Mode) = @_;

  # A missing or non-reference argument cannot be dereferenced (it is a fatal
  # error under strict refs), so treat it the same way as an empty array.
  if (!ref($XArrayRef) || !@$XArrayRef) {
    return undef;
  }
  my($Variance, $Value, $SquareOfDeviations, $Mean, $N);

  $N = ($Mode == 1) ? @$XArrayRef : (@$XArrayRef - 1);
  if ($N == 0) {
    # One value with the (n - 1) divisor: the variance is undefined, and
    # dividing would die with "Illegal division by zero".
    return undef;
  }

  $Mean = Mean($XArrayRef);
  $SquareOfDeviations = 0;
  foreach $Value (@$XArrayRef) {
    $SquareOfDeviations += ($Value - $Mean) ** 2;
  }
  $Variance = $SquareOfDeviations / $N;

  return $Variance;
}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
817
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
818 1;
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
819
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
820 __END__
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
821
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
822 =head1 NAME
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
823
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
824 StatisticsUtil
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
825
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
826 =head1 SYNOPSIS
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
827
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
828 use StatisticsUtil;
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
829
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
830 use StatisticsUtil qw(:all);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
831
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
832 =head1 DESCRIPTION
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
833
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
834 B<StatisticsUtil> module provides the following functions:
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
835
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
836 Average, AverageDeviation, Correlation, Covariance, Euclidean, Factorial,
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
837 FactorialDivision, Frequency, GeometricMean, HarmonicMean, KLargest, KSmallest,
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
838 Kurtosis, Maximum, Mean, Median, Minimum, Mode, PearsonCorrelation, Permutations,
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
839 Product, RSquare, Range, Skewness, StandardDeviation, StandardDeviationN,
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
840 StandardError, StandardScores, StandardScoresN, Standardize, Sum, SumOfSquares,
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
841 TrimMean, Variance, VarianceN
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
842
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
843 =head2 METHODS
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
844
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
845 =over 4
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
846
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
847 =item B<Average>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
848
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
849 $Value = Average(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
850
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
851 Computes the mean of an array of numbers: SUM( x[i] ) / n
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
852
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
853 =item B<AverageDeviation>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
854
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
855 $Value = AverageDeviation(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
856
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
857 Computes the average of the absolute deviation of an array of numbers: SUM( ABS(x[i] - Xmean) ) / n
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
858
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
859 =item B<Correlation>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
860
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
861 $Value = Correlation(\@XDataArray, \@YDataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
862
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
863 Computes the Pearson correlation coefficient between two arrays of numbers:
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
864 SUM( (x[i] - Xmean)(y[i] - Ymean) ) / SQRT( SUM( (x[i] - Xmean)^2 )(SUM( (y[i] - Ymean)^2 )) )
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
865
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
866 =item B<Euclidean>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
867
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
868 $Return = Euclidean(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
869
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
870 Computes the euclidean distance of an array of numbers: SQRT( SUM( x[i] ** 2) )
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
871
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
872 =item B<Covariance>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
873
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
874 $Value = Covariance(\@XDataArray, \@YDataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
875
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
876 Computes the covariance between two arrays of numbers: SUM( (x[i] - Xmean) (y[i] - Ymean) ) / n
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
877
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
878 =item B<Factorial>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
879
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
880 $Value = Factorial($Num);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
881
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
882 Computes the factorial of a positive integer.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
883
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
884 =item B<FactorialDivision>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
885
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
886 $Value = FactorialDivision($Numerator, $Denominator);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
887
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
888 Computes the factorial division of two positive integers.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
889
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
890 =item B<Frequency>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
891
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
892 %FrequencyValues = Frequency(\@DataArray, [$NumOfBins]);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
893 %FrequencyValues = Frequency(\@DataArray, [\@BinRange]);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
894
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
895 A hash array is returned with keys and values representing range and frequency values, respectively.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
896 The frequency value for a specific key corresponds to all the values which are greater than
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
897 the previous key and less than or equal to the current key. A key value representing maximum value is
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
898 added for generating frequency distribution for specific number of bins, and whenever the maximum
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
899 array value is greater than the maximum specified in bin range, it is also added to bin range.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
900
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
901 =item B<GeometricMean>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
902
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
903 $Value = GeometricMean(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
904
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
905 Computes the geometric mean of an array of numbers: NthROOT( PRODUCT(x[i]) )
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
906
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
907 =item B<HarmonicMean>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
908
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
909 $Value = HarmonicMean(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
910
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
911 Computes the harmonic mean of an array of numbers: 1 / ( SUM(1/x[i]) / n )
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
912
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
913 =item B<KLargest>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
914
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
915 $Value = KLargest(\@DataArray, $KthNumber);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
916
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
917 Returns the k-largest value from an array of numbers.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
918
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
919 =item B<KSmallest>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
920
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
921 $Value = KSmallest(\@DataArray, $KthNumber);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
922
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
923 Returns the k-smallest value from an array of numbers.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
924
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
925 =item B<Kurtosis>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
926
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
927 $Value = Kurtosis(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
928
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
929 Computes the kurtosis of an array of numbers:
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
930 [ {n(n + 1)/(n - 1)(n - 2)(n - 3)} SUM{ ((x[i] - Xmean)/STDDEV)^4 } ] - {3((n - 1)^2)}/{(n - 2)(n-3)}
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
931
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
932 =item B<Maximum>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
933
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
934 $Value = Maximum(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
935
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
936 Returns the largest value from an array of numbers.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
937
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
938 =item B<Minimum>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
939
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
940 $Value = Minimum(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
941
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
942 Returns the smallest value from an array of numbers.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
943
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
944 =item B<Mean>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
945
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
946 $Value = Mean(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
947
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
948 Computes the mean of an array of numbers: SUM( x[i] ) / n
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
949
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
950 =item B<Median>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
951
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
952 $Value = Median(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
953
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
954 Computes the median value of an array of numbers. For an even number array, it's
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
955 the average of two middle values.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
956
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
957 For odd values of n: Xsorted[(n - 1)/2 + 1]
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
958 For even values of n: (Xsorted[n/2] + Xsorted[n/2 + 1])/2
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
959
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
960 =item B<Mode>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
961
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
962 $Value = Mode(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
963
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
964 Returns the most frequently occurring value in an array of numbers.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
965
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
966 =item B<PearsonCorrelation>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
967
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
968 $Value = PearsonCorrelation(\@XDataArray, \@YDataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
969
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
970 Computes the Pearson correlation coefficient between two arrays of numbers:
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
971 SUM( (x[i] - Xmean)(y[i] - Ymean) ) / SQRT( SUM( (x[i] - Xmean)^2 )(SUM( (y[i] - Ymean)^2 )) )
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
972
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
973 =item B<Permutations>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
974
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
975 $PermutationsRef = Permutations(@DataToPermute);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
976
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
977 Generate all possible permutations or specific permutations of items in an array
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
978 and return a reference to an array containing array references to generated permutations.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
979
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
980 This algorithm is based on the example provided by Mark Jason Dominus, and is available
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
981 at CPAN as mjd_permute standalone script.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
982
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
983 =item B<Product>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
984
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
985 $Value = Product(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
986
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
987 Compute the product of an array of numbers.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
988
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
989 =item B<Range>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
990
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
991 ($Smallest, $Largest) = Range(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
992
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
993 Return the smallest and largest values from an array of numbers.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
994
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
995 =item B<RSquare>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
996
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
997 $Value = RSquare(\@XDataArray, \@YDataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
998
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
999 Computes square of the Pearson correlation coefficient between two arrays of numbers.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1000
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1001 =item B<Skewness>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1002
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1003 $Value = Skewness(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1004
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1005 Computes the skewness of an array of numbers:
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1006 {n/(n - 1)(n - 2)} SUM{ ((x[i] - Xmean)/STDDEV)^3 }
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1007
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1008 =item B<StandardDeviation>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1009
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1010 $Value = StandardDeviation(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1011
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1012 Computes the standard deviation of an array of numbers.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1013 SQRT ( SUM( (x[i] - mean)^2 ) / (n - 1) )
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1014
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1015 =item B<StandardDeviationN>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1016
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1017 $Value = StandardDeviationN(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1018
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1019 Computes the standard deviation of an array of numbers representing entire population:
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1020 SQRT ( SUM( (x[i] - mean)^2 ) / n )
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1021
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1022 =item B<StandardError>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1023
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1024 $Value = StandardError($StandardDeviation, $Count);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1025
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1026 Computes the standard error using standard deviation and sample size.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1027
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1028 =item B<Standardize>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1029
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1030 $Value = Standardize($Value, $Mean, $StandardDeviation);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1031
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1032 Standardizes the value using mean and standard deviation.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1033
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1034 =item B<StandardScores>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1035
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1036 @Values = StandardScores(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1037
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1038 Computes the number of standard deviations above the mean for each value in an array of numbers:
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1039 (x[i] - mean) / STDDEV, where STDDEV = SQRT ( SUM( (x[i] - mean)^2 ) / (n - 1) )
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1040
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1041 =item B<StandardScoresN>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1042
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1043 @Values = StandardScoresN(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1044
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1045 Computes the number of standard deviations above the mean for each value in an array of numbers representing entire population:
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1046 (x[i] - mean) / STDDEVN, where STDDEVN = SQRT ( SUM( (x[i] - mean)^2 ) / n )
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1047
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1048 =item B<Sum>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1049
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1050 $Value = Sum(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1051
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1052 Compute the sum of an array of numbers.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1053
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1054 =item B<SumOfSquares>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1055
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1056 $Value = SumOfSquares(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1057
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1058 Computes the sum of squares of an array of numbers: SUM( x[i]^2 )
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1059
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1060 =item B<TrimMean>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1061
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1062 $Value = TrimMean(\@DataArray, $FractionToExclude);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1063
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1064 Computes the mean of an array of numbers by excluding a fraction of
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1065 numbers from the top and bottom of the data set.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1066
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1067 =item B<Variance>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1068
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1069 $Value = Variance(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1070
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1071 Computes the variance of an array of numbers: SUM( (x[i] - Xmean)^2 / (n - 1) )
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1072
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1073 =item B<VarianceN>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1074
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1075 $Value = VarianceN(\@DataArray);
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1076
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1077 Compute the variance of an array of numbers representing entire population:
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1078 SUM( (x[i] - Xmean)^2 / n )
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1079
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1080 =back
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1081
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1082 =head1 AUTHOR
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1083
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1084 Manish Sud <msud@san.rr.com>
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1085
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1086 =head1 SEE ALSO
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1087
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1088 Constants.pm, ConversionsUtil.pm, MathUtil.pm
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1089
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1090 =head1 COPYRIGHT
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1091
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1092 Copyright (C) 2015 Manish Sud. All rights reserved.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1093
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1094 This file is part of MayaChemTools.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1095
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1096 MayaChemTools is free software; you can redistribute it and/or modify it under
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1097 the terms of the GNU Lesser General Public License as published by the Free
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1098 Software Foundation; either version 3 of the License, or (at your option)
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1099 any later version.
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1100
2abf0d43254d Uploaded
deepakjadmin
parents:
diff changeset
1101 =cut