annotate lib/Fingerprints/FingerprintsBitVector.pm @ 0:4816e4a8ae95 draft default tip

Uploaded
author deepakjadmin
date Wed, 20 Jan 2016 09:23:18 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1 package Fingerprints::FingerprintsBitVector;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
2 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
3 # $RCSfile: FingerprintsBitVector.pm,v $
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
4 # $Date: 2015/02/28 20:48:54 $
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
5 # $Revision: 1.27 $
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
6 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
7 # Author: Manish Sud <msud@san.rr.com>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
8 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
9 # Copyright (C) 2015 Manish Sud. All rights reserved.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
10 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
11 # This file is part of MayaChemTools.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
12 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
13 # MayaChemTools is free software; you can redistribute it and/or modify it under
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
14 # the terms of the GNU Lesser General Public License as published by the Free
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
15 # Software Foundation; either version 3 of the License, or (at your option) any
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
16 # later version.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
17 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
18 # MayaChemTools is distributed in the hope that it will be useful, but without
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
19 # any warranty; without even the implied warranty of merchantability of fitness
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
20 # for a particular purpose. See the GNU Lesser General Public License for more
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
21 # details.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
22 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
23 # You should have received a copy of the GNU Lesser General Public License
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
24 # along with MayaChemTools; if not, see <http://www.gnu.org/licenses/> or
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
25 # write to the Free Software Foundation Inc., 59 Temple Place, Suite 330,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
26 # Boston, MA, 02111-1307, USA.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
27 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
28
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
29 use strict;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
30 use Carp;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
31 use Exporter;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
32 use Scalar::Util ();
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
33 use BitVector;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
34 use MathUtil;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
35 use TextUtil ();
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
36
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
use vars qw(@ISA @EXPORT @EXPORT_OK %EXPORT_TAGS);

@ISA = qw(BitVector Exporter);

# Names of the similarity coefficient functions offered for export...
my(@SimilarityCoefficients) = qw(BaroniUrbaniSimilarityCoefficient BuserSimilarityCoefficient CosineSimilarityCoefficient DiceSimilarityCoefficient DennisSimilarityCoefficient ForbesSimilarityCoefficient FossumSimilarityCoefficient HamannSimilarityCoefficient JacardSimilarityCoefficient Kulczynski1SimilarityCoefficient Kulczynski2SimilarityCoefficient MatchingSimilarityCoefficient McConnaugheySimilarityCoefficient OchiaiSimilarityCoefficient PearsonSimilarityCoefficient RogersTanimotoSimilarityCoefficient RussellRaoSimilarityCoefficient SimpsonSimilarityCoefficient SkoalSneath1SimilarityCoefficient SkoalSneath2SimilarityCoefficient SkoalSneath3SimilarityCoefficient TanimotoSimilarityCoefficient TverskySimilarityCoefficient YuleSimilarityCoefficient WeightedTanimotoSimilarityCoefficient WeightedTverskySimilarityCoefficient);

# Names of the functions creating a fingerprints bit vector from a string...
my(@NewFromString) = qw(NewFromBinaryString NewFromHexadecimalString NewFromRawBinaryString);

# Exported by default...
@EXPORT = qw(IsFingerprintsBitVector);

# Exported on request...
#
# Note:
#   . qw() does not interpolate arrays: the two name lists have to be added as
#     list elements. Placing them inside qw() registers the literal strings
#     '@NewFromString' and '@SimilarityCoefficients' instead of the function
#     names, which leaves the names used by 'new' and 'coefficients' tags out
#     of the list of exportable symbols.
#
@EXPORT_OK = (qw(GetSupportedSimilarityCoefficients), @NewFromString, @SimilarityCoefficients);

%EXPORT_TAGS = (
  new => [@NewFromString],
  coefficients => [@SimilarityCoefficients],
  all => [@EXPORT, @EXPORT_OK]
);

# Setup class variables...
my($ClassName);
_InitializeClass();

# Conversion of an object to a string is delegated to the method named below...
use overload '""' => 'StringifyFingerprintsBitVector';
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
61
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Class constructor: create a fingerprints bit vector of a specified size...
#
# The object is created by the constructor of the parent class, blessed into the
# class of the invocant (a class name or an already existing object), and then
# initialized by _InitializeFingerprintsBitVector using the same size.
#
# Returns the new object.
#
sub new {
  my($Class, $Size) = @_;
  my($This, $TargetClass);

  # Let the parent class build the underlying object...
  $This = $Class->SUPER::new($Size);

  # Invocant may be a class name or an object...
  $TargetClass = ref($Class) || $Class;
  bless $This, $TargetClass;

  $This->_InitializeFingerprintsBitVector($Size);

  return $This;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
73
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Initialize fingerprints specific object data...
#
# Size is validated (it must be defined and greater than zero; otherwise an
# error is raised through croak) and stored as SpecifiedSize.
#
# Note:
#   . The class, BitVector, used to derive this class provides all the
#     functionality to manipulate bits.
#   . As noted by the original author: irrespective of the specified size, Perl
#     functions used to handle bit data in BitVector class automatically set the
#     size to the next nearest power of 2. SpecifiedSize is kept by this class to
#     process any arbitrary size during similarity coefficient calculations.
#
sub _InitializeFingerprintsBitVector {
  my($This, $Size) = @_;

  croak "Error: ${ClassName}->new: FingerprintsBitVector object instantiated without specifying its size ..."
    unless defined $Size;

  croak "Error: ${ClassName}->new: Fingerprints bit vector size, $Size, must be a positive integer..."
    if $Size <= 0;

  # Size requested by the caller...
  $This->{SpecifiedSize} = $Size;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
98
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Initialize class level data...
#
# Stores the name of this package in ClassName, the file level variable used
# in error messages and type checks.
#
sub _InitializeClass {
  # Name of the class is the name of the current package...
  return $ClassName = __PACKAGE__;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
104
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Set specified size of fingerprints bit vector...
#
# Specified size must be greater than zero and must not exceed the Size value
# stored in the object; otherwise an error is raised through croak. The value
# stored is also the value returned.
#
# Notes:
#   As noted by the original author: irrespective of the specified size, Perl
#   functions used to handle bit data in BitVector class automatically set the
#   size to the next nearest power of 2. SpecifiedSize is kept by this class to
#   process any arbitrary size during similarity coefficient calculations.
#
sub SetSpecifiedSize {
  my($This, $SpecifiedSize) = @_;
  my($IsValidSize);

  $IsValidSize = ($SpecifiedSize > 0 && $SpecifiedSize <= $This->{Size});
  if (!$IsValidSize) {
    croak "Error: ${ClassName}->SetSpecifiedSize: Specified size, $SpecifiedSize, is not valid: It must be > 0 && <= ", $This->GetSize()," ...";
  }

  return $This->{SpecifiedSize} = $SpecifiedSize;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
121
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Get specified size of fingerprints bit vector...
#
# Returns the SpecifiedSize value stored in the object.
#
sub GetSpecifiedSize {
  my $This = shift;

  return $This->{SpecifiedSize};
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
128
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Set ID of fingerprints bit vector...
#
# Stores the value as ID and returns the object itself.
#
sub SetID {
  my $This = shift;
  my($ID) = @_;

  $This->{ID} = $ID;

  return $This;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
137
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Get ID of fingerprints bit vector...
#
# Returns the stored ID; the string 'None' is returned for an object without
# an ID entry.
#
sub GetID {
  my $This = shift;

  if (exists $This->{ID}) {
    return $This->{ID};
  }

  return 'None';
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
144
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Set description of fingerprints bit vector...
#
# Stores the value as Description and returns the object itself.
#
sub SetDescription {
  my $This = shift;
  my($Description) = @_;

  $This->{Description} = $Description;

  return $This;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
153
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Get description of fingerprints bit vector...
#
# Returns the stored description; the string 'No description available' is
# returned for an object without a Description entry.
#
sub GetDescription {
  my $This = shift;

  if (exists $This->{Description}) {
    return $This->{Description};
  }

  return 'No description available';
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
160
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Set vector type of fingerprints bit vector...
#
# Stores the value as VectorType and returns the object itself.
#
sub SetVectorType {
  my $This = shift;
  my($VectorType) = @_;

  $This->{VectorType} = $VectorType;

  return $This;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
169
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Get vector type of fingerprints bit vector...
#
# Returns the stored vector type; the string 'FingerprintsBitVector' is
# returned for an object without a VectorType entry.
#
sub GetVectorType {
  my $This = shift;

  if (exists $This->{VectorType}) {
    return $This->{VectorType};
  }

  return 'FingerprintsBitVector';
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
176
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Create a new fingerprints bit vector using a binary string...
#
# This functionality can be invoked either as a class function, with the string
# and an optional bits order as parameters, or as an object method. In the
# latter case, the invoking object is only used to recognize the calling
# convention and is otherwise ignored.
#
# NOTE(review): a first parameter which is not a fingerprints bit vector object,
# such as a class name passed by Class->NewFromBinaryString(...), is treated as
# the string - confirm that this calling style is not expected to work.
#
sub NewFromBinaryString ($;$) {
  my(@Parameters) = @_;

  # Drop the invocant for an object method call...
  if (_IsFingerprintsBitVector($Parameters[0])) {
    shift @Parameters;
  }
  my($String, $BitsOrder) = @Parameters;

  return _NewFingerptinsBitVectorFromString('Binary', $String, $BitsOrder);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
190
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Create a new fingerprints bit vector using a hexadecimal string...
#
# This functionality can be invoked either as a class function, with the string
# and an optional bits order as parameters, or as an object method. In the
# latter case, the invoking object is only used to recognize the calling
# convention and is otherwise ignored.
#
# NOTE(review): a first parameter which is not a fingerprints bit vector object,
# such as a class name passed by Class->NewFromHexadecimalString(...), is
# treated as the string - confirm that this calling style is not expected to
# work.
#
sub NewFromHexadecimalString ($;$) {
  my(@Parameters) = @_;

  # Drop the invocant for an object method call...
  if (_IsFingerprintsBitVector($Parameters[0])) {
    shift @Parameters;
  }
  my($String, $BitsOrder) = @Parameters;

  return _NewFingerptinsBitVectorFromString('Hexadecimal', $String, $BitsOrder);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
204
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Creation of a fingerprints bit vector from an octal string is not supported:
# any call raises an error through croak...
#
sub NewFromOctalString ($) {
  my($ErrorMessage);

  $ErrorMessage = "Error: ${ClassName}->NewFromOctalString: Creation of fingerprits bit vector from an octal string is not supported ...";

  croak $ErrorMessage;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
212
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Creation of a fingerprints bit vector from a decimal string is not supported:
# any call raises an error through croak...
#
sub NewFromDecimalString ($;$) {
  my($ErrorMessage);

  $ErrorMessage = "Error: ${ClassName}->NewFromDecimalString: Creation of fingerprits bit vector from a decimal string is not supported ...";

  croak $ErrorMessage;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
219
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Create a new fingerprints bit vector using a raw binary string...
#
# This functionality can be invoked either as a class function, with the string
# and an optional bits order as parameters, or as an object method. In the
# latter case, the invoking object is only used to recognize the calling
# convention and is otherwise ignored.
#
# NOTE(review): a first parameter which is not a fingerprints bit vector object,
# such as a class name passed by Class->NewFromRawBinaryString(...), is treated
# as the string - confirm that this calling style is not expected to work.
#
sub NewFromRawBinaryString ($;$) {
  my(@Parameters) = @_;

  # Drop the invocant for an object method call...
  if (_IsFingerprintsBitVector($Parameters[0])) {
    shift @Parameters;
  }
  my($String, $BitsOrder) = @Parameters;

  return _NewFingerptinsBitVectorFromString('RawBinary', $String, $BitsOrder);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
233
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Create a new fingerprints bit vector from a string in a specified format...
#
# The size of the new bit vector is the number of bits calculated for the
# string by BitVector::_CalculateStringSizeInBits. The bits are then set from
# the string using the specified format and bits order.
#
# Returns the new fingerprints bit vector object.
#
sub _NewFingerptinsBitVectorFromString ($$;$) {
  my($Format, $String, $BitsOrder) = @_;

  my $SizeInBits = BitVector::_CalculateStringSizeInBits($Format, $String);

  my $NewBitVector = Fingerprints::FingerprintsBitVector->new($SizeInBits);
  $NewBitVector->_SetBitsAsString($Format, $String, $BitsOrder);

  return $NewBitVector;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
248
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Get fingerprint bits as a hexadecimal string...
#
# An optional bits order is handed over as is to
# _GetFingerprintBitsAsString, whose result is returned.
#
sub GetBitsAsHexadecimalString {
  my $This = shift;
  my($BitsOrder) = @_;

  return $This->_GetFingerprintBitsAsString('Hexadecimal', $BitsOrder);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
256
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Retrieval of fingerprint bits as an octal string is not supported: any call
# raises an error through croak...
#
sub GetBitsAsOctalString {
  my($This, $BitsOrder) = @_;
  my($ErrorMessage);

  $ErrorMessage = "Error: ${ClassName}->GetBitsAsOctalString: Retrieval of fingerprits bits as an octal string is not supported ...";

  croak $ErrorMessage;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
264
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Retrieval of fingerprint bits as a decimal string is not supported: any call
# raises an error through croak...
#
# Parameters are accepted for consistency with the other GetBitsAs...String
# methods, but are not used.
#
sub GetBitsAsDecimalString {
  my($This, $BitsOrder) = @_;

  # Error message names this method; it used to name GetBitsAsOctalString...
  croak "Error: ${ClassName}->GetBitsAsDecimalString: Retrieval of fingerprits bits as a decimal string is not supported ...";
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
272
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Get fingerprint bits as a binary string...
#
# An optional bits order is handed over as is to
# _GetFingerprintBitsAsString, whose result is returned.
#
sub GetBitsAsBinaryString {
  my $This = shift;
  my($BitsOrder) = @_;

  return $This->_GetFingerprintBitsAsString('Binary', $BitsOrder);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
280
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Get fingerprint bits as a raw binary string...
#
# No bits order is accepted or passed on: _GetFingerprintBitsAsString is called
# with the format only and its result is returned.
#
sub GetBitsAsRawBinaryString {
  my $This = shift;

  return $This->_GetFingerprintBitsAsString('RawBinary');
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
288
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Return fingerprint bits as a string in a specified format...
#
# A missing or false bits order (undefined, empty string or zero) is replaced
# by 'Ascending' before _GetBitsAsString is called; its result is returned.
#
sub _GetFingerprintBitsAsString {
  my($This, $Format, $BitsOrder) = @_;

  # Default bits order...
  my $EffectiveBitsOrder = $BitsOrder || 'Ascending';

  return $This->_GetBitsAsString($Format, $EffectiveBitsOrder);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
298
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Is it a fingerprints bit vector object?
#
# Exported front end of _IsFingerprintsBitVector: returns its result for the
# specified value.
#
sub IsFingerprintsBitVector ($) {
  my $Candidate = shift;

  return _IsFingerprintsBitVector($Candidate);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
305
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Is it a fingerprints bit vector object?
#
# Returns 1 for a blessed reference whose class is, or is derived from, the
# class named by ClassName; 0 is returned for everything else.
#
sub _IsFingerprintsBitVector {
  my($Object) = @_;

  # Anything which is not an object can't be a fingerprints bit vector...
  return 0 unless Scalar::Util::blessed($Object);

  return $Object->isa($ClassName) ? 1 : 0;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
312
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Return names of the supported similarity coefficients...
#
# The names are taken from the file level list, SimilarityCoefficients. The
# function takes no parameters.
#
sub GetSupportedSimilarityCoefficients () {
  return @SimilarityCoefficients;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
318
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Get bit density of fingerprints bit vector corresponding to on bits...
#
# Returns the value provided by GetDensityOfSetBits after passing it through
# round with 2 as the second parameter.
#
sub GetFingerprintsBitDensity {
  my $This = shift;

  my $DensityOfSetBits = $This->GetDensityOfSetBits();

  return round($DensityOfSetBits, 2);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
329
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Fold fingerprints bit vector by size...
#
# As described by the original author, folding recursively reduces the size by
# half until it is less than or equal to the specified size; the folding itself
# is performed by _FoldFingerprintsBitVector in 'BySize' mode.
#
# Specified size must be greater than zero and must not exceed the current size
# reported by GetSize; otherwise an error is raised through croak. The object
# itself is returned without folding for a current size which is already less
# than or equal to the specified size.
#
sub FoldFingerprintsBitVectorBySize {
  my($This, $Size) = @_;

  unless ($Size > 0 && $Size <= $This->GetSize()) {
    croak "Error: ${ClassName}->FoldFingerprintsBitVectorBySize: Specified size, $Size, is not valid: It must be > 0 && <= ", $This->GetSize()," ...";
  }

  # Nothing to fold...
  return ($This->GetSize() <= $Size)
    ? $This
    : $This->_FoldFingerprintsBitVector('BySize', $Size);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
345
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Fold fingerprints bit vector by density...
#
# As described by the original author, folding recursively reduces the size by
# half until the bit density of set bits is greater than or equal to the
# specified density; the folding itself is performed by
# _FoldFingerprintsBitVector in 'ByDensity' mode.
#
# Specified density must be greater than zero and must not exceed 1; otherwise
# an error is raised through croak. The object itself is returned without
# folding for a density of set bits, as reported by GetDensityOfSetBits, which
# is already greater than or equal to the specified density.
#
sub FoldFingerprintsBitVectorByDensity {
  my($This, $Density) = @_;

  unless ($Density > 0 && $Density <= 1) {
    croak "Error: ${ClassName}->FoldFingerprintsBitVectorByDensity: Specified bit density, $Density, is not valid: It must be > 0 && <= 1 ...";
  }

  # Nothing to fold...
  return ($This->GetDensityOfSetBits() >= $Density)
    ? $This
    : $This->_FoldFingerprintsBitVector('ByDensity', $Density);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
361
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Fold fingerprints bit vector using size or density and return folded fingerprints bit vector...
#
# Mode is matched case insensitively against BySize or ByDensity and Value is the size or
# density to reach. The bit vector is returned as is when any of the following is true:
#
#   . Its size is <= 8 bits
#   . BySize mode: its size is <= Value
#   . ByDensity mode: its density of set bits is >= Value
#   . Mode is neither BySize nor ByDensity
#
# Otherwise, its binary string is split at half of its length, a bit vector is created from
# each half, the two are combined using | operator, and the combined bit vector is folded
# again using the same mode and value.
#
sub _FoldFingerprintsBitVector {
  my($This, $Mode, $Value) = @_;

  # Never fold below a size of 8 bits...
  return $This if ($This->GetSize() <= 8);

  # Has the requested size or density been reached?
  if ($Mode =~ /^BySize$/i) {
    return $This if ($This->GetSize() <= $Value);
  }
  elsif ($Mode =~ /^ByDensity$/i) {
    return $This if ($This->GetDensityOfSetBits() >= $Value);
  }
  else {
    # Unknown mode: leave bit vector unchanged...
    return $This;
  }

  # Split bits into two halves...
  my $Bits = $This->GetBitsAsBinaryString();
  my $HalfLength = (length $Bits)/2;

  my $LeadingBits = substr($Bits, 0, $HalfLength);
  my $TrailingBits = substr($Bits, $HalfLength);

  # Combine the halves and keep folding...
  my $LeadingBitVector = NewFromBinaryString($LeadingBits);
  my $TrailingBitVector = NewFromBinaryString($TrailingBits);
  my $CombinedBitVector = $LeadingBitVector | $TrailingBitVector;

  return $CombinedBitVector->_FoldFingerprintsBitVector($Mode, $Value);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
403
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Is first bit vector subset of second bit vector?
#
# For a bit vector to be a subset of another bit vector, both vectors must be of
# the same size and the bit positions set in the first vector must also be set in the
# second bit vector.
#
# Returns 1 for a subset and 0 otherwise; bit vectors of different sizes always return 0.
#
# This functionality can be either invoked as a class function or an object method.
#
sub IsSubSet ($$) {
  my($BitVectorA, $BitVectorB) = @_;

  return 0 if ($BitVectorA->GetSize() != $BitVectorB->GetSize());

  # A is a subset of B when A & B keeps all the bits set in A...
  my $CommonBitVector = $BitVectorA & $BitVectorB;

  if ($BitVectorA->GetNumOfSetBits() == $CommonBitVector->GetNumOfSetBits()) {
    return 1;
  }
  return 0;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
424
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Return a string containing size information, number of set bits, bit density and
# vector values...
#
# The string starts with "SpecifiedSize: <n>; BitVectorSize: <n>" when the specified size
# is different from the bit vector size and with "BitVectorSize: <n>" otherwise. It is
# followed by "; NumOfOnBits: <n>; BitDensity: <n>; BitVector: <values>".
#
sub StringifyFingerprintsBitVector {
  my($This) = @_;

  # BitVector size information...
  my $FingerprintsBitVectorString = ($This->{SpecifiedSize} != $This->GetSize())
    ? "SpecifiedSize: " . $This->{SpecifiedSize} . "; BitVectorSize: " . $This->GetSize()
    : "BitVectorSize: " . $This->GetSize();

  # Set bits information...
  my $NumOfSetBits = $This->GetNumOfSetBits();
  my $BitDensity = $This->GetFingerprintsBitDensity();

  $FingerprintsBitVectorString .= "; NumOfOnBits: $NumOfSetBits; BitDensity: $BitDensity";

  # BitVector values...
  return $FingerprintsBitVectorString . "; BitVector: " . $This->StringifyBitVector();
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
449
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
450 # For two fingerprints bit vectors A and B of same size, let:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
451 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
452 # Na = Number of bits set to "1" in A
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
453 # Nb = Number of bits set to "1" in B
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
454 # Nc = Number of bits set to "1" in both A and B
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
455 # Nd = Number of bits set to "0" in both A and B
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
456 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
457 # Nt = Number of bits set to "1" or "0" in A or B = Size of A or B = Na + Nb - Nc + Nd
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
458 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
459 # Na - Nc = Number of bits set to "1" in A but not in B
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
460 # Nb - Nc = Number of bits set to "1" in B but not in A
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
461 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
462 # Various similarity coefficients [ Ref 40 - 42 ] for a pair of bit vectors A and B are
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
463 # defined as follows:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
464 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
465 # . BaroniUrbani: ( SQRT( Nc * Nd ) + Nc ) / ( SQRT ( Nc * Nd ) + Nc + ( Na - Nc ) + ( Nb - Nc ) ) ( same as Buser )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
466 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
467 # . Buser: ( SQRT ( Nc * Nd ) + Nc ) / ( SQRT ( Nc * Nd ) + Nc + ( Na - Nc ) + ( Nb - Nc ) ) ( same as BaroniUrbani )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
468 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
469 # . Cosine: Nc / SQRT ( Na * Nb ) (same as Ochiai)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
470 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
471 # . Dice: (2 * Nc) / ( Na + Nb )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
472 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
473 # . Dennis: ( Nc * Nd - ( ( Na - Nc ) * ( Nb - Nc ) ) ) / SQRT ( Nt * Na * Nb)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
474 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
475 # . Forbes: ( Nt * Nc ) / ( Na * Nb )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
476 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
477 # . Fossum: ( Nt * ( ( Nc - 1/2 ) ** 2 ) ) / ( Na * Nb )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
478 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
479 # . Hamann: ( ( Nc + Nd ) - ( Na - Nc ) - ( Nb - Nc ) ) / Nt
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
480 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
481 # . Jaccard: Nc / ( ( Na - Nc) + ( Nb - Nc ) + Nc ) = Nc / ( Na + Nb - Nc ) (same as Tanimoto)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
482 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
483 # . Kulczynski1: Nc / ( ( Na - Nc ) + ( Nb - Nc) ) = Nc / ( Na + Nb - 2Nc )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
484 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
485 # . Kulczynski2: ( ( Nc / 2 ) * ( 2 * Nc + ( Na - Nc ) + ( Nb - Nc) ) ) / ( ( Nc + ( Na - Nc ) ) * ( Nc + ( Nb - Nc ) ) ) = 0.5 * ( Nc / Na + Nc / Nb )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
486 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
487 # . Matching: ( Nc + Nd ) / Nt
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
488 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
489 # . McConnaughey: ( Nc ** 2 - ( Na - Nc ) * ( Nb - Nc) ) / ( Na * Nb )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
490 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
491 # . Ochiai: Nc / SQRT ( Na * Nb ) (same as Cosine)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
492 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
493 # . Pearson: ( ( Nc * Nd ) - ( ( Na - Nc ) * ( Nb - Nc ) ) ) / SQRT ( Na * Nb * ( Na - Nc + Nd ) * ( Nb - Nc + Nd ) )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
494 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
495 # . RogersTanimoto: ( Nc + Nd ) / ( ( Na - Nc) + ( Nb - Nc) + Nt) = ( Nc + Nd ) / ( Na + Nb - 2Nc + Nt)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
496 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
497 # . RussellRao: Nc / Nt
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
498 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
499 # . Simpson: Nc / MIN ( Na, Nb)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
500 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
501 # . SkoalSneath1: Nc / ( Nc + 2 * ( Na - Nc) + 2 * ( Nb - Nc) ) = Nc / ( 2 * Na + 2 * Nb - 3 * Nc )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
502 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
503 # . SkoalSneath2: ( 2 * Nc + 2 * Nd ) / ( Nc + Nd + Nt )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
504 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
505 # . SkoalSneath3: ( Nc + Nd ) / ( ( Na - Nc ) + ( Nb - Nc ) ) = ( Nc + Nd ) / ( Na + Nb - 2 * Nc )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
506 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
507 # . Tanimoto: Nc / ( ( Na - Nc) + ( Nb - Nc ) + Nc ) = Nc / ( Na + Nb - Nc ) (same as Jaccard)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
508 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
509 # . Tversky: Nc / ( alpha * ( Na - Nc ) + ( 1 - alpha) * ( Nb - Nc) + Nc ) = Nc / ( alpha * ( Na - Nb ) + Nb)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
510 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
511 # . Yule: ( ( Nc * Nd ) - ( ( Na - Nc ) * ( Nb - Nc ) ) ) / ( ( Nc * Nd ) + ( ( Na - Nc ) * ( Nb - Nc ) ) )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
512 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
513 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
514 # Values of Tanimoto/Jaccard and Tversky coefficients depend only on those bits which
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
515 # are set to "1" in both A and B. In order to take into account all bit positions, modified versions
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
516 # of Tanimoto [ Ref. 42 ] and Tversky [ Ref. 43 ] have been developed.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
517 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
518 # Let:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
519 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
520 # Na' = Number of bits set to "0" in A
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
521 # Nb' = Number of bits set to "0" in B
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
522 # Nc' = Number of bits set to "0" in both A and B
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
523 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
524 # . Tanimoto': Nc' / ( ( Na' - Nc') + ( Nb' - Nc' ) + Nc' ) = Nc' / ( Na' + Nb' - Nc' )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
525 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
526 # . Tversky': Nc' / ( alpha * ( Na' - Nc' ) + ( 1 - alpha) * ( Nb' - Nc' ) + Nc' ) = Nc' / ( alpha * ( Na' - Nb' ) + Nb')
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
527 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
528 # Then:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
529 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
530 # . WeightedTanimoto = beta * Tanimoto + (1 - beta) * Tanimoto'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
531 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
532 # . WeightedTversky = beta * Tversky + (1 - beta) * Tversky'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
533 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
534 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
535
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate BaroniUrbani similarity coefficient for two same size bit vectors.
#
# The calculation is handed over to BuserSimilarityCoefficient and its value is returned
# as is.
#
# This functionality can be either invoked as a class function or an object method.
#
sub BaroniUrbaniSimilarityCoefficient ($$) {
  my($BitVectorA, $BitVectorB) = @_;

  return BuserSimilarityCoefficient($BitVectorA, $BitVectorB);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
545
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate Buser similarity coefficient for two same size bit vectors:
#
#   ( SQRT ( Nc * Nd ) + Nc ) / ( SQRT ( Nc * Nd ) + Nc + ( Na - Nc ) + ( Nb - Nc ) )
#
# where Na and Nb are the number of bits set in A and B, Nc is the number of bits set
# in both A and B, and Nd is the number of bits clear in both A and B. A value of 0 is
# returned when the denominator is zero.
#
# This functionality can be either invoked as a class function or an object method.
#
sub BuserSimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;
  my($Na, $Nb, $Nc, $Nd, $SqrtNcNd, $Numerator, $Denominator);

  ($Na, $Nb, $Nc) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);
  $Nd = _GetNumOfCommonClearBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  # SQRT ( Nc * Nd ) is shared by numerator and denominator; calculate it only once...
  $SqrtNcNd = sqrt($Nc*$Nd);

  $Numerator = $SqrtNcNd + $Nc;
  $Denominator = $SqrtNcNd + ($Na - $Nc) + ($Nb - $Nc ) + $Nc;

  return $Denominator ? ($Numerator/$Denominator) : 0;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
563
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate Cosine similarity coefficient for two same size bit vectors:
#
#   Nc / SQRT ( Na * Nb )
#
# where Na and Nb are the number of bits set in A and B, and Nc is the number of bits
# set in both A and B. A value of 0 is returned when the denominator is zero.
#
# This functionality can be either invoked as a class function or an object method.
#
sub CosineSimilarityCoefficient ($$) {
  my($BitVectorA, $BitVectorB) = @_;

  my($Na, $Nb, $Nc) = _GetNumOfIndividualAndCommonSetBits($BitVectorA, $BitVectorB);
  my $Denominator = sqrt($Na*$Nb);

  return 0 unless $Denominator;

  return $Nc/$Denominator;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
579
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate Dice similarity coefficient for two same size bit vectors:
#
#   ( 2 * Nc ) / ( Na + Nb )
#
# where Na and Nb are the number of bits set in A and B, and Nc is the number of bits
# set in both A and B. A value of 0 is returned when the denominator is zero.
#
# This functionality can be either invoked as a class function or an object method.
#
sub DiceSimilarityCoefficient ($$) {
  my($BitVectorA, $BitVectorB) = @_;

  my($Na, $Nb, $Nc) = _GetNumOfIndividualAndCommonSetBits($BitVectorA, $BitVectorB);
  my $Denominator = $Na + $Nb;

  return 0 unless $Denominator;

  return (2*$Nc)/$Denominator;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
595
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate Dennis similarity coefficient for two same size bit vectors:
#
#   ( Nc * Nd - ( ( Na - Nc ) * ( Nb - Nc ) ) ) / SQRT ( Nt * Na * Nb )
#
# where Na and Nb are the number of bits set in A and B, Nc is the number of bits set
# in both A and B, Nd is the number of bits clear in both A and B, and
# Nt = Na + Nb - Nc + Nd. A value of 0 is returned when the denominator is zero.
#
# This functionality can be either invoked as a class function or an object method.
#
sub DennisSimilarityCoefficient ($$) {
  my($BitVectorA, $BitVectorB) = @_;

  my($Na, $Nb, $Nc) = _GetNumOfIndividualAndCommonSetBits($BitVectorA, $BitVectorB);
  my $Nd = _GetNumOfCommonClearBits($BitVectorA, $BitVectorB);
  my $Nt = $Na + $Nb - $Nc + $Nd;

  my $Denominator = sqrt($Nt*$Na*$Nb);
  return 0 unless $Denominator;

  my $Numerator = $Nc*$Nd - (($Na - $Nc)*($Nb - $Nc));

  return $Numerator/$Denominator;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
613
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate Forbes similarity coefficient for two same size bit vectors:
#
#   ( Nt * Nc ) / ( Na * Nb )
#
# where Na and Nb are the number of bits set in A and B, Nc is the number of bits set
# in both A and B, Nd is the number of bits clear in both A and B, and
# Nt = Na + Nb - Nc + Nd. A value of 0 is returned when the denominator is zero.
#
# This functionality can be either invoked as a class function or an object method.
#
sub ForbesSimilarityCoefficient ($$) {
  my($BitVectorA, $BitVectorB) = @_;

  my($Na, $Nb, $Nc) = _GetNumOfIndividualAndCommonSetBits($BitVectorA, $BitVectorB);
  my $Nd = _GetNumOfCommonClearBits($BitVectorA, $BitVectorB);
  my $Nt = $Na + $Nb - $Nc + $Nd;

  my $Denominator = $Na*$Nb;
  return 0 unless $Denominator;

  return ($Nt*$Nc)/$Denominator;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
631
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate Fossum similarity coefficient for two same size bit vectors:
#
#   ( Nt * ( ( Nc - 1/2 ) ** 2 ) ) / ( Na * Nb )
#
# where Na and Nb are the number of bits set in A and B, Nc is the number of bits set
# in both A and B, Nd is the number of bits clear in both A and B, and
# Nt = Na + Nb - Nc + Nd. A value of 0 is returned when the denominator is zero.
#
# This functionality can be either invoked as a class function or an object method.
#
sub FossumSimilarityCoefficient ($$) {
  my($BitVectorA, $BitVectorB) = @_;

  my($Na, $Nb, $Nc) = _GetNumOfIndividualAndCommonSetBits($BitVectorA, $BitVectorB);
  my $Nd = _GetNumOfCommonClearBits($BitVectorA, $BitVectorB);
  my $Nt = $Na + $Nb - $Nc + $Nd;

  my $Denominator = $Na*$Nb;
  return 0 unless $Denominator;

  my $Numerator = $Nt*(($Nc - 0.5)** 2);

  return $Numerator/$Denominator;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
649
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate Hamann similarity coefficient for two same size bit vectors:
#
#   ( ( Nc + Nd ) - ( Na - Nc ) - ( Nb - Nc ) ) / Nt
#
# where Na and Nb are the number of bits set in A and B, Nc is the number of bits set
# in both A and B, Nd is the number of bits clear in both A and B, and
# Nt = Na + Nb - Nc + Nd. A value of 0 is returned when the denominator is zero.
#
# This functionality can be either invoked as a class function or an object method.
#
sub HamannSimilarityCoefficient ($$) {
  my($BitVectorA, $BitVectorB) = @_;

  my($Na, $Nb, $Nc) = _GetNumOfIndividualAndCommonSetBits($BitVectorA, $BitVectorB);
  my $Nd = _GetNumOfCommonClearBits($BitVectorA, $BitVectorB);

  # Total number of bits is used as the denominator...
  my $Nt = $Na + $Nb - $Nc + $Nd;
  return 0 unless $Nt;

  my $Numerator = ($Nc + $Nd ) - ($Na - $Nc) - ($Nb - $Nc);

  return $Numerator/$Nt;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
667
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate Jacard similarity coefficient for two same size bit vectors.
#
# The calculation is handed over to TanimotoSimilarityCoefficient and its value is
# returned as is.
#
# This functionality can be either invoked as a class function or an object method.
#
sub JacardSimilarityCoefficient ($$) {
  my($BitVectorA, $BitVectorB) = @_;

  return TanimotoSimilarityCoefficient($BitVectorA, $BitVectorB);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
677
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Kulczynski1 similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, and Nc the number of bits
# set in both, the value is:
#
#   Nc / (Na + Nb - 2*Nc)
#
# Returns 0 when the denominator is zero.
#
# It may be invoked either as a class function or as an object method.
#
sub Kulczynski1SimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;

  my($SetBitsA, $SetBitsB, $CommonSetBits) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  my $Divisor = $SetBitsA + $SetBitsB - 2*$CommonSetBits;
  if (!$Divisor) {
    return 0;
  }

  return $CommonSetBits/$Divisor;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
693
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Kulczynski2 similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, and Nc the number of bits
# set in both, the value is:
#
#   0.5*(Na*Nc + Nb*Nc) / (Na*Nb)
#
# Returns 0 when the denominator is zero.
#
# It may be invoked either as a class function or as an object method.
#
sub Kulczynski2SimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;

  my($SetBitsA, $SetBitsB, $CommonSetBits) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  my $Divisor = $SetBitsA*$SetBitsB;
  if (!$Divisor) {
    return 0;
  }

  my $Dividend = 0.5*($SetBitsA*$CommonSetBits + $SetBitsB*$CommonSetBits);

  return $Dividend/$Divisor;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
709
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Matching similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, Nc the number of bits set
# in both, Nd the value returned by _GetNumOfCommonClearBits, and
# Nt = Na + Nb - Nc + Nd, the value is:
#
#   (Nc + Nd) / Nt
#
# Returns 0 when the denominator is zero.
#
# It may be invoked either as a class function or as an object method.
#
sub MatchingSimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;

  my($SetBitsA, $SetBitsB, $CommonSetBits) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);
  my $CommonClearBits = _GetNumOfCommonClearBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  my $BitTotal = $SetBitsA + $SetBitsB - $CommonSetBits + $CommonClearBits;
  if (!$BitTotal) {
    return 0;
  }

  return ($CommonSetBits + $CommonClearBits)/$BitTotal;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
727
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# McConnaughey similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, and Nc the number of bits
# set in both, the value is:
#
#   (Nc**2 - (Na - Nc)*(Nb - Nc)) / (Na*Nb)
#
# Returns 0 when the denominator is zero.
#
# It may be invoked either as a class function or as an object method.
#
sub McConnaugheySimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;

  my($SetBitsA, $SetBitsB, $CommonSetBits) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  my $Divisor = $SetBitsA*$SetBitsB;
  if (!$Divisor) {
    return 0;
  }

  my $Dividend = $CommonSetBits**2 - (($SetBitsA - $CommonSetBits)*($SetBitsB - $CommonSetBits));

  return $Dividend/$Divisor;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
743
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Ochiai similarity coefficient for two same size bit vectors.
#
# This is an alias: the value is obtained from CosineSimilarityCoefficient for
# the same pair of bit vectors and handed back unchanged.
#
# It may be invoked either as a class function or as an object method.
#
sub OchiaiSimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;
  my($CosineValue);

  $CosineValue = CosineSimilarityCoefficient($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  return $CosineValue;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
753
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate Pearson similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, Nc the number of bits set
# in both, and Nd the value returned by _GetNumOfCommonClearBits, the value is:
#
#   (Nc*Nd - (Na - Nc)*(Nb - Nc)) / sqrt(Na*Nb*(Na - Nc + Nd)*(Nb - Nc + Nd))
#
# Returns 0 when the denominator is zero.
#
# This functionality can be either invoked as a class function or an object method.
#
sub PearsonSimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;
  my($Na, $Nb, $Nc, $Nd, $Numerator, $Denominator);

  ($Na, $Nb, $Nc) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);
  $Nd = _GetNumOfCommonClearBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  # Nt (Na + Nb - Nc + Nd) is not part of this formula, so it is not computed.
  $Numerator = ($Nc*$Nd) - (($Na - $Nc)*($Nb - $Nc));
  $Denominator = sqrt($Na*$Nb*($Na - $Nc + $Nd)*($Nb - $Nc + $Nd));

  return $Denominator ? ($Numerator/$Denominator) : 0;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
771
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# RogersTanimoto similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, Nc the number of bits set
# in both, Nd the value returned by _GetNumOfCommonClearBits, and
# Nt = Na + Nb - Nc + Nd, the value is:
#
#   (Nc + Nd) / ((Na - Nc) + (Nb - Nc) + Nt)
#
# Returns 0 when the denominator is zero.
#
# It may be invoked either as a class function or as an object method.
#
sub RogersTanimotoSimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;

  my($SetBitsA, $SetBitsB, $CommonSetBits) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);
  my $CommonClearBits = _GetNumOfCommonClearBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);
  my $BitTotal = $SetBitsA + $SetBitsB - $CommonSetBits + $CommonClearBits;

  my $Divisor = ($SetBitsA - $CommonSetBits) + ($SetBitsB - $CommonSetBits) + $BitTotal;
  if (!$Divisor) {
    return 0;
  }

  return ($CommonSetBits + $CommonClearBits)/$Divisor;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
789
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# RussellRao similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, Nc the number of bits set
# in both, Nd the value returned by _GetNumOfCommonClearBits, and
# Nt = Na + Nb - Nc + Nd, the value is:
#
#   Nc / Nt
#
# Returns 0 when the denominator is zero.
#
# It may be invoked either as a class function or as an object method.
#
sub RussellRaoSimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;

  my($SetBitsA, $SetBitsB, $CommonSetBits) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);
  my $CommonClearBits = _GetNumOfCommonClearBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  my $BitTotal = $SetBitsA + $SetBitsB - $CommonSetBits + $CommonClearBits;
  if (!$BitTotal) {
    return 0;
  }

  return $CommonSetBits/$BitTotal;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
807
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Simpson similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, and Nc the number of bits
# set in both, the value is:
#
#   Nc / min(Na, Nb)
#
# Returns 0 when the denominator is zero.
#
# It may be invoked either as a class function or as an object method.
#
sub SimpsonSimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;

  my($SetBitsA, $SetBitsB, $CommonSetBits) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  my $SmallerSetBitCount = min($SetBitsA, $SetBitsB);
  if (!$SmallerSetBitCount) {
    return 0;
  }

  return $CommonSetBits/$SmallerSetBitCount;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
823
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# SkoalSneath1 similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, and Nc the number of bits
# set in both, the value is:
#
#   Nc / (Nc + 2*(Na - Nc) + 2*(Nb - Nc))
#
# Returns 0 when the denominator is zero.
#
# It may be invoked either as a class function or as an object method.
#
sub SkoalSneath1SimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;

  my($SetBitsA, $SetBitsB, $CommonSetBits) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  my $Divisor = $CommonSetBits + 2*($SetBitsA - $CommonSetBits) + 2*($SetBitsB - $CommonSetBits);
  if (!$Divisor) {
    return 0;
  }

  return $CommonSetBits/$Divisor;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
839
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# SkoalSneath2 similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, Nc the number of bits set
# in both, Nd the value returned by _GetNumOfCommonClearBits, and
# Nt = Na + Nb - Nc + Nd, the value is:
#
#   (2*Nc + 2*Nd) / (Nc + Nd + Nt)
#
# Returns 0 when the denominator is zero.
#
# It may be invoked either as a class function or as an object method.
#
sub SkoalSneath2SimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;

  my($SetBitsA, $SetBitsB, $CommonSetBits) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);
  my $CommonClearBits = _GetNumOfCommonClearBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);
  my $BitTotal = $SetBitsA + $SetBitsB - $CommonSetBits + $CommonClearBits;

  my $Divisor = $CommonSetBits + $CommonClearBits + $BitTotal;
  if (!$Divisor) {
    return 0;
  }

  return (2*$CommonSetBits + 2*$CommonClearBits)/$Divisor;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
857
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate SkoalSneath3 similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, Nc the number of bits set
# in both, and Nd the value returned by _GetNumOfCommonClearBits, the value is:
#
#   (Nc + Nd) / ((Na - Nc) + (Nb - Nc))
#
# Returns 0 when the denominator is zero.
#
# This functionality can be either invoked as a class function or an object method.
#
sub SkoalSneath3SimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;
  my($Na, $Nb, $Nc, $Nd, $Numerator, $Denominator);

  ($Na, $Nb, $Nc) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);
  $Nd = _GetNumOfCommonClearBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  # Nt (Na + Nb - Nc + Nd) is not part of this formula, so it is not computed.
  $Numerator = $Nc + $Nd;
  $Denominator = ($Na - $Nc) + ($Nb - $Nc);

  return $Denominator ? ($Numerator/$Denominator) : 0;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
875
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Tanimoto similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, and Nc the number of bits
# set in both, the value is:
#
#   Nc / (Na + Nb - Nc)
#
# Returns 0 when the denominator is zero.
#
# It may be invoked either as a class function or as an object method.
#
sub TanimotoSimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;

  my($SetBitsA, $SetBitsB, $CommonSetBits) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  my $Divisor = $SetBitsA + $SetBitsB - $CommonSetBits;
  if (!$Divisor) {
    return 0;
  }

  return $CommonSetBits/$Divisor;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
891
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Tversky similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, and Nc the number of bits
# set in both, the value is:
#
#   Nc / (Alpha*(Na - Nb) + Nb)
#
# Alpha must be defined and lie in the range 0 to 1 inclusive; otherwise the
# call croaks before any bit counting is done. Returns 0 when the denominator
# is zero.
#
# It may be invoked either as a class function or as an object method.
#
sub TverskySimilarityCoefficient ($$$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB, $Alpha) = @_;

  unless (defined($Alpha) && $Alpha >= 0 && $Alpha <= 1) {
    croak "Error: ${ClassName}->TverskySimilarityCoefficient: Alpha parameters must be defined and its value must be >=0 and <=1 ...";
  }

  my($SetBitsA, $SetBitsB, $CommonSetBits) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  my $Divisor = $Alpha*($SetBitsA - $SetBitsB ) + $SetBitsB;
  if (!$Divisor) {
    return 0;
  }

  return $CommonSetBits/$Divisor;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
911
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate Yule similarity coefficient for two same size bit vectors.
#
# With Na and Nb the number of set bits in A and B, Nc the number of bits set
# in both, and Nd the value returned by _GetNumOfCommonClearBits, the value is:
#
#   (Nc*Nd - (Na - Nc)*(Nb - Nc)) / (Nc*Nd + (Na - Nc)*(Nb - Nc))
#
# Returns 0 when the denominator is zero.
#
# This functionality can be either invoked as a class function or an object method.
#
sub YuleSimilarityCoefficient ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;
  my($Na, $Nb, $Nc, $Nd, $Numerator, $Denominator);

  ($Na, $Nb, $Nc) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);
  $Nd = _GetNumOfCommonClearBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  # Nt (Na + Nb - Nc + Nd) is not part of this formula, so it is not computed.
  $Numerator = ($Nc*$Nd) - (($Na - $Nc)*($Nb - $Nc));
  $Denominator = ($Nc*$Nd) + (($Na - $Nc)*($Nb - $Nc));

  return $Denominator ? ($Numerator/$Denominator) : 0;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
929
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# WeightedTanimoto similarity coefficient for two same size bit vectors.
#
# Two Tanimoto-style ratios, Nc / (Na + Nb - Nc), are formed: one from the
# counts returned by _GetNumOfIndividualAndCommonSetBits and one from the
# counts returned by _GetNumOfIndividualAndCommonClearBits. Either ratio is
# taken as 0 when its denominator is zero. The result is:
#
#   Beta*TanimotoForSetBits + (1 - Beta)*TanimotoForClearBits
#
# Beta must be defined and lie in the range 0 to 1 inclusive; otherwise the
# call croaks before any bit counting is done.
#
# It may be invoked either as a class function or as an object method.
#
sub WeightedTanimotoSimilarityCoefficient ($$$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB, $Beta) = @_;

  unless (defined($Beta) && $Beta >= 0 && $Beta <= 1) {
    croak "Error: ${ClassName}->WeightedTanimotoSimilarityCoefficient: Beta parameters must be defined and its value must be >=0 and <=1 ...";
  }

  # Shared ratio for both passes; only the first three counts are used.
  my $TanimotoRatio = sub {
    my($CountInA, $CountInB, $CountInBoth) = @_;
    my $Divisor = $CountInA + $CountInB - $CountInBoth;

    return $Divisor ? ($CountInBoth/$Divisor) : 0;
  };

  # Set bits first, then clear bits: same order as the counting helpers are
  # expected to be called in.
  my $SetBitsTanimoto = $TanimotoRatio->(_GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB));
  my $ClearBitsTanimoto = $TanimotoRatio->(_GetNumOfIndividualAndCommonClearBits($FingerprintsBitVectorA, $FingerprintsBitVectorB));

  return $Beta*$SetBitsTanimoto + (1 - $Beta)*$ClearBitsTanimoto;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
960
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Calculate WeightedTversky similarity coefficient for two same size bit vectors.
#
# Two Tversky-style ratios, Nc / (Alpha*(Na - Nb) + Nb), are formed: one from
# the counts returned by _GetNumOfIndividualAndCommonSetBits and one from the
# counts returned by _GetNumOfIndividualAndCommonClearBits. Either ratio is
# taken as 0 when its denominator is zero. The result is:
#
#   Beta*TverskyForSetBits + (1 - Beta)*TverskyForClearBits
#
# Alpha and Beta must both be defined and lie in the range 0 to 1 inclusive;
# otherwise the call croaks before any bit counting is done.
#
# The prototype accepts a fourth argument so that Beta can actually be passed
# in a prototype-checked function call; the previous three-argument prototype
# did not allow it. The fourth slot is marked optional so that existing
# three-argument calls still compile and reach the Beta check below.
#
# This functionality can be either invoked as a class function or an object method.
#
sub WeightedTverskySimilarityCoefficient ($$$;$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB, $Alpha, $Beta) = @_;
  my($Na, $Nb, $Nc, $TverskyForSetBits, $TverskyForClearBits, $Numerator, $Denominator, $WeightedTversky);

  if (!(defined($Alpha) && ($Alpha >= 0 && $Alpha <= 1))) {
    croak "Error: ${ClassName}->WeightedTverskySimilarityCoefficient: Alpha parameters must be defined and its value must be >=0 and <=1 ...";
  }
  if (!(defined($Beta) && ($Beta >= 0 && $Beta <= 1))) {
    croak "Error: ${ClassName}->WeightedTverskySimilarityCoefficient: Beta parameters must be defined and its value must be >=0 and <=1 ...";
  }

  # Get Tversky for set bits...
  ($Na, $Nb, $Nc) = _GetNumOfIndividualAndCommonSetBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  $Numerator = $Nc;
  $Denominator = $Alpha*($Na - $Nb ) + $Nb;
  $TverskyForSetBits = $Denominator ? ($Numerator/$Denominator) : 0;

  # Get Tversky for clear bits...
  ($Na, $Nb, $Nc) = _GetNumOfIndividualAndCommonClearBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  $Numerator = $Nc;
  $Denominator = $Alpha*($Na - $Nb ) + $Nb;
  $TverskyForClearBits = $Denominator ? ($Numerator/$Denominator) : 0;

  $WeightedTversky = $Beta*$TverskyForSetBits + (1 - $Beta)*$TverskyForClearBits;

  return $WeightedTversky;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
994
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Get number of Na, Nb and Nc bits in bit vector A and B to be used for similarity coefficient calculations...
#
# Returns the list (Na, Nb, Nc) where:
#
#   Na - number of bits set to "1" in A
#   Nb - number of bits set to "1" in B
#   Nc - number of bits set to "1" in both A and B
#
# Both arguments must support the GetNumOfSetBits method and the "&" operator;
# the object produced by "&" must support GetNumOfSetBits as well.
#
sub _GetNumOfIndividualAndCommonSetBits ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;
  my($Na, $Nb, $Nc, $NcBitVector);

  # Number of bits set to "1" in A
  $Na = $FingerprintsBitVectorA->GetNumOfSetBits();

  # Number of bits set to "1" in B
  $Nb = $FingerprintsBitVectorB->GetNumOfSetBits();

  # Number of bits set to "1" in both A and B: AND the two vectors and count
  # the set bits of the result.
  $NcBitVector = $FingerprintsBitVectorA & $FingerprintsBitVectorB;
  $Nc = $NcBitVector->GetNumOfSetBits();

  return ($Na, $Nb, $Nc);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1014
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Count the bits that are set to "0" in both bit vectors A and B. This is the
# Nd value used for similarity coefficient calculations.
#
sub _GetNumOfCommonClearBits ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;

  # Complementing both vectors and combining them with "&" leaves a set bit
  # at every position where both A and B were clear.
  my $CommonClearBitsVector = ~$FingerprintsBitVectorA & ~$FingerprintsBitVectorB;
  my $Nd = $CommonClearBitsVector->GetNumOfSetBits();

  # Correct for number of clear bits used for padding. Exactly one correction
  # is applied: the one for A when A needs it, otherwise the one for B when B
  # needs it.
  for my $BitVector ($FingerprintsBitVectorA, $FingerprintsBitVectorB) {
    next unless _IsNumOfClearBitsCorrectionRequired($BitVector);
    $Nd -= _GetNumOfClearBitsCorrection($BitVector);
    last;
  }

  return $Nd;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1035
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Count the clear bits used for similarity coefficient calculations.
#
# Takes two fingerprints bit vectors, A and B, and returns the list (Na, Nb, Nc):
#
#   Na - Number of bits set to "0" in A, corrected for padding bits
#   Nb - Number of bits set to "0" in B, corrected for padding bits
#   Nc - Number of bits set to "0" in both A and B, as returned by
#        _GetNumOfCommonClearBits, which applies its own padding correction
#
sub _GetNumOfIndividualAndCommonClearBits ($$) {
  my($FingerprintsBitVectorA, $FingerprintsBitVectorB) = @_;

  # Number of bits set to "0" in A, less any clear bits used for padding...
  my $Na = $FingerprintsBitVectorA->GetNumOfClearBits();
  if (_IsNumOfClearBitsCorrectionRequired($FingerprintsBitVectorA)) {
    $Na -= _GetNumOfClearBitsCorrection($FingerprintsBitVectorA);
  }

  # Number of bits set to "0" in B, less any clear bits used for padding...
  my $Nb = $FingerprintsBitVectorB->GetNumOfClearBits();
  if (_IsNumOfClearBitsCorrectionRequired($FingerprintsBitVectorB)) {
    $Nb -= _GetNumOfClearBitsCorrection($FingerprintsBitVectorB);
  }

  # Number of bits set to "0" in both A and B
  my $Nc = _GetNumOfCommonClearBits($FingerprintsBitVectorA, $FingerprintsBitVectorB);

  return ($Na, $Nb, $Nc);
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1063
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Irrespective of the specified size, the Perl functions used to handle bit data
# in the BitVector class automatically set the size to the next nearest power
# of 2 and clear the extra bits.
#
# SpecifiedSize is used by this class to process any arbitrary size during
# similarity coefficient calculations.
#
# Assuming the FingerprintsBitVector class only manipulates bits up to the
# specified size, a correction for the extra bits added by the BitVector class
# needs to be applied to the number of clear bits.
#
# Returns that correction: the object's Size minus its SpecifiedSize.
#
sub _GetNumOfClearBitsCorrection {
  my($FingerprintsBitVector) = @_;

  my($Size, $SpecifiedSize) = @{$FingerprintsBitVector}{qw(Size SpecifiedSize)};

  return $Size - $SpecifiedSize;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1080
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Does the number of clear bits need a correction?
#
# Returns 1 when the Size of the bit vector is larger than its SpecifiedSize,
# and 0 otherwise.
#
sub _IsNumOfClearBitsCorrectionRequired {
  my($FingerprintsBitVector) = @_;

  if ($FingerprintsBitVector->{Size} > $FingerprintsBitVector->{SpecifiedSize}) {
    return 1;
  }

  return 0;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1088
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1089
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1090 1;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1091
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1092 __END__
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1093
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1094 =head1 NAME
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1095
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1096 FingerprintsBitVector
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1097
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1098 =head1 SYNOPSIS
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1099
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1100 use Fingerprints::FingerprintsBitVector;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1101
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1102 use Fingerprints::FingerprintsBitVector qw(:coefficients);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1103
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1104 use Fingerprints::FingerprintsBitVector qw(:all);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1105
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1106 =head1 DESCRIPTION
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1107
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1108 B<FingerprintsBitVector> class provides the following methods:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1109
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1110 new, BaroniUrbaniSimilarityCoefficient, BuserSimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1111 CosineSimilarityCoefficient, DennisSimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1112 DiceSimilarityCoefficient, FoldFingerprintsBitVectorByDensity,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1113 FoldFingerprintsBitVectorBySize, ForbesSimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1114 FossumSimilarityCoefficient, GetBitsAsBinaryString, GetBitsAsDecimalString,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1115 GetBitsAsHexadecimalString, GetBitsAsOctalString, GetBitsAsRawBinaryString,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1116 GetDescription, GetFingerprintsBitDensity, GetID, GetSpecifiedSize,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1117 GetSupportedSimilarityCoefficients, GetVectorType, HamannSimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1118 IsFingerprintsBitVector, IsSubSet, JacardSimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1119 Kulczynski1SimilarityCoefficient, Kulczynski2SimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1120 MatchingSimilarityCoefficient, McConnaugheySimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1121 NewFromBinaryString, NewFromDecimalString, NewFromHexadecimalString,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1122 NewFromOctalString, NewFromRawBinaryString, OchiaiSimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1123 PearsonSimilarityCoefficient, RogersTanimotoSimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1124 RussellRaoSimilarityCoefficient, SetDescription, SetID, SetSpecifiedSize,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1125 SetVectorType, SimpsonSimilarityCoefficient, SkoalSneath1SimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1126 SkoalSneath2SimilarityCoefficient, SkoalSneath3SimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1127 StringifyFingerprintsBitVector, TanimotoSimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1128 TverskySimilarityCoefficient, WeightedTanimotoSimilarityCoefficient,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1129 WeightedTverskySimilarityCoefficient, YuleSimilarityCoefficient
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1130
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1131 The methods available to create fingerprints bit vector from strings and to calculate similarity
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1132 coefficient between two bit vectors can also be invoked as class functions.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1133
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1134 B<FingerprintsBitVector> class is derived from B<BitVector> class which provides the functionality
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1135 to manipulate bits.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1136
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1137 For two fingerprints bit vectors A and B of same size, let:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1138
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1139 Na = Number of bits set to "1" in A
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1140 Nb = Number of bits set to "1" in B
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1141 Nc = Number of bits set to "1" in both A and B
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1142 Nd = Number of bits set to "0" in both A and B
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1143
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1144 Nt = Number of bits set to "1" or "0" in A or B (Size of A or B)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1145 Nt = Na + Nb - Nc + Nd
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1146
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1147 Na - Nc = Number of bits set to "1" in A but not in B
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1148 Nb - Nc = Number of bits set to "1" in B but not in A
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1149
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1150 Then, various similarity coefficients [ Ref. 40 - 42 ] for a pair of bit vectors A and B are
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1151 defined as follows:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1152
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1153 BaroniUrbani: ( SQRT( Nc * Nd ) + Nc ) / ( SQRT ( Nc * Nd ) + Nc + ( Na - Nc ) + ( Nb - Nc ) ) ( same as Buser )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1154
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1155 Buser: ( SQRT ( Nc * Nd ) + Nc ) / ( SQRT ( Nc * Nd ) + Nc + ( Na - Nc ) + ( Nb - Nc ) ) ( same as BaroniUrbani )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1156
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1157 Cosine: Nc / SQRT ( Na * Nb ) (same as Ochiai)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1158
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1159 Dice: (2 * Nc) / ( Na + Nb )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1160
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1161 Dennis: ( Nc * Nd - ( ( Na - Nc ) * ( Nb - Nc ) ) ) / SQRT ( Nt * Na * Nb)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1162
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1163 Forbes: ( Nt * Nc ) / ( Na * Nb )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1164
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1165 Fossum: ( Nt * ( ( Nc - 1/2 ) ** 2 ) ) / ( Na * Nb )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1166
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1167 Hamann: ( ( Nc + Nd ) - ( Na - Nc ) - ( Nb - Nc ) ) / Nt
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1168
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1169 Jaccard: Nc / ( ( Na - Nc) + ( Nb - Nc ) + Nc ) = Nc / ( Na + Nb - Nc ) (same as Tanimoto)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1170
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1171 Kulczynski1: Nc / ( ( Na - Nc ) + ( Nb - Nc) ) = Nc / ( Na + Nb - 2Nc )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1172
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1173 Kulczynski2: ( ( Nc / 2 ) * ( 2 * Nc + ( Na - Nc ) + ( Nb - Nc) ) ) / ( ( Nc + ( Na - Nc ) ) * ( Nc + ( Nb - Nc ) ) )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1174 = 0.5 * ( Nc / Na + Nc / Nb )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1175
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1176 Matching: ( Nc + Nd ) / Nt
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1177
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1178 McConnaughey: ( Nc ** 2 - ( Na - Nc ) * ( Nb - Nc) ) / ( Na * Nb )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1179
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1180 Ochiai: Nc / SQRT ( Na * Nb ) (same as Cosine)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1181
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1182 Pearson: ( ( Nc * Nd ) - ( ( Na - Nc ) * ( Nb - Nc ) ) ) / SQRT ( Na * Nb * ( Na - Nc + Nd ) * ( Nb - Nc + Nd ) )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1183
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1184 RogersTanimoto: ( Nc + Nd ) / ( ( Na - Nc) + ( Nb - Nc) + Nt) = ( Nc + Nd ) / ( Na + Nb - 2Nc + Nt)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1185
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1186 RussellRao: Nc / Nt
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1187
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1188 Simpson: Nc / MIN ( Na, Nb)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1189
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1190 SkoalSneath1: Nc / ( Nc + 2 * ( Na - Nc) + 2 * ( Nb - Nc) ) = Nc / ( 2 * Na + 2 * Nb - 3 * Nc )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1191
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1192 SkoalSneath2: ( 2 * Nc + 2 * Nd ) / ( Nc + Nd + Nt )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1193
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1194 SkoalSneath3: ( Nc + Nd ) / ( ( Na - Nc ) + ( Nb - Nc ) ) = ( Nc + Nd ) / ( Na + Nb - 2 * Nc )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1195
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1196 Tanimoto: Nc / ( ( Na - Nc) + ( Nb - Nc ) + Nc ) = Nc / ( Na + Nb - Nc ) (same as Jaccard)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1197
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1198 Tversky: Nc / ( alpha * ( Na - Nc ) + ( 1 - alpha) * ( Nb - Nc) + Nc ) = Nc / ( alpha * ( Na - Nb ) + Nb)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1199
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1200 Yule: ( ( Nc * Nd ) - ( ( Na - Nc ) * ( Nb - Nc ) ) ) / ( ( Nc * Nd ) + ( ( Na - Nc ) * ( Nb - Nc ) ) )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1201
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1202 The values of Tanimoto/Jaccard and Tversky coefficients are dependent on only those bits which
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1203 are set to "1" in both A and B. In order to take into account all bit positions, modified versions
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1204 of Tanimoto [ Ref. 42 ] and Tversky [ Ref. 43 ] have been developed.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1205
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1206 Let:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1207
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1208 Na' = Number of bits set to "0" in A
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1209 Nb' = Number of bits set to "0" in B
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1210 Nc' = Number of bits set to "0" in both A and B
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1211
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1212 Tanimoto': Nc' / ( ( Na' - Nc') + ( Nb' - Nc' ) + Nc' ) = Nc' / ( Na' + Nb' - Nc' )
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1213
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1214 Tversky': Nc' / ( alpha * ( Na' - Nc' ) + ( 1 - alpha) * ( Nb' - Nc' ) + Nc' ) = Nc' / ( alpha * ( Na' - Nb' ) + Nb')
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1215
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1216 Then:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1217
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1218 WeightedTanimoto = beta * Tanimoto + (1 - beta) * Tanimoto'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1219
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1220 WeightedTversky = beta * Tversky + (1 - beta) * Tversky'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1221
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1222 =head2 METHODS
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1223
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1224 =over 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1225
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1226 =item B<new>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1227
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1228 $NewFPBitVector = new Fingerprints::FingerprintsBitVector($Size);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1229
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1230 Creates a new I<FingerprintsBitVector> object of size I<Size> and returns newly created
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1231 B<FingerprintsBitVector>. Bit numbers range from 0 to 1 less than I<Size>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1232
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1233 =item B<BaroniUrbaniSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1234
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1235 $Value = $FingerprintsBitVector->BaroniUrbaniSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1236 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1237 $Value = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1238 BaroniUrbaniSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1239 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1240
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1241 Returns value of I<BaroniUrbani> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1242
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1243 =item B<BuserSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1244
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1245 $Value = $FingerprintsBitVector->BuserSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1246 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1247 $Value = Fingerprints::FingerprintsBitVector::BuserSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1248 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1249
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1250 Returns value of I<Buser> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1251
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1252 =item B<CosineSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1253
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1254 $Value = $FingerprintsBitVector->CosineSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1255 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1256 $Value = Fingerprints::FingerprintsBitVector::CosineSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1257 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1258
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1259 Returns value of I<Cosine> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1260
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1261 =item B<DennisSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1262
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1263 $Value = $FingerprintsBitVector->DennisSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1264 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1265 $Value = Fingerprints::FingerprintsBitVector::DennisSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1266 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1267
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1268 Returns value of I<Dennis> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1269
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1270 =item B<DiceSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1271
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1272 $Value = $FingerprintsBitVector->DiceSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1273 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1274 $Value = Fingerprints::FingerprintsBitVector::DiceSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1275 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1276
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1277 Returns value of I<Dice> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1278
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1279 =item B<FoldFingerprintsBitVectorByDensity>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1280
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1281 $FingerprintsBitVector->FoldFingerprintsBitVectorByDensity($Density);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1282
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1283 Folds I<FingerprintsBitVector> by recursively reducing its size by half until bit density of set bits is
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1284 greater than or equal to specified I<Density> and returns folded I<FingerprintsBitVector>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1285
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1286 =item B<FoldFingerprintsBitVectorBySize>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1287
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1288 $FingerprintsBitVector->FoldFingerprintsBitVectorBySize($Size);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1289
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1290 Folds I<FingerprintsBitVector> by recursively reducing its size by half until size is less than or equal to
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1291 specified I<Size> and returns folded I<FingerprintsBitVector>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1292
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1293 =item B<ForbesSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1294
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1295 $Value = $FingerprintsBitVector->ForbesSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1296 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1297 $Value = Fingerprints::FingerprintsBitVector::ForbesSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1298 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1299
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1300 Returns value of I<Forbes> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1301
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1302 =item B<FossumSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1303
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1304 $Value = $FingerprintsBitVector->FossumSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1305 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1306 $Value = Fingerprints::FingerprintsBitVector::FossumSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1307 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1308
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1309 Returns value of I<Fossum> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1310
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1311 =item B<GetBitsAsBinaryString>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1312
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1313 $BinaryASCIIString = $FingerprintsBitVector->GetBitsAsBinaryString();
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1314
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1315 Returns fingerprints as a binary ASCII string containing 0s and 1s.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1316
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1317 =item B<GetBitsAsHexadecimalString>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1318
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1319 $HexadecimalString = $FingerprintsBitVector->GetBitsAsHexadecimalString();
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1320
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1321 Returns fingerprints as a hexadecimal string.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1322
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1323 =item B<GetBitsAsRawBinaryString>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1324
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1325 $RawBinaryString = $FingerprintsBitVector->GetBitsAsRawBinaryString();
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1326
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1327 Returns fingerprints as a raw binary string containing packed bit values for each byte.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1328
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1329 =item B<GetDescription>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1330
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1331 $Description = $FingerprintsBitVector->GetDescription();
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1332
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1333 Returns a string containing description of fingerprints bit vector.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1334
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1335 =item B<GetFingerprintsBitDensity>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1336
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1337 $BitDensity = $FingerprintsBitVector->GetFingerprintsBitDensity();
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1338
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1339 Returns I<BitDensity> of I<FingerprintsBitVector> corresponding to bits set to 1s.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1340
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1341 =item B<GetID>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1342
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1343 $ID = $FingerprintsBitVector->GetID();
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1344
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1345 Returns I<ID> of I<FingerprintsBitVector>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1346
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1347 =item B<GetVectorType>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1348
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1349 $VectorType = $FingerprintsBitVector->GetVectorType();
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1350
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1351 Returns I<VectorType> of I<FingerprintsBitVector>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1352
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1353 =item B<GetSpecifiedSize>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1354
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1355 $Size = $FingerprintsBitVector->GetSpecifiedSize();
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1356
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1357 Returns value of specified size for bit vector.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1358
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1359 =item B<GetSupportedSimilarityCoefficients>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1360
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1361 @SimilarityCoefficient =
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1362 Fingerprints::FingerprintsBitVector::GetSupportedSimilarityCoefficients();
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1363
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1364 Returns an array containing names of supported similarity coefficients.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1365
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1366 =item B<HamannSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1367
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1368 $Value = $FingerprintsBitVector->HamannSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1369 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1370 $Value = Fingerprints::FingerprintsBitVector::HamannSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1371 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1372
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1373 Returns value of I<Hamann> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1374
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1375 =item B<IsFingerprintsBitVector>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1376
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1377 $Status = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1378 IsFingerprintsBitVector($Object);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1379
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1380 Returns 1 or 0 based on whether I<Object> is a B<FingerprintsBitVector> object.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1381
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1382 =item B<IsSubSet>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1383
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1384 $Status = $FingerprintsBitVector->IsSubSet($OtherFPBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1385 $Status = Fingerprints::FingerprintsBitVector::IsSubSet(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1386 $FPBitVectorA, $FPBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1387
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1388 Returns 1 or 0 based on whether first fingerprints bit vector is a subset of second
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1389 fingerprints bit vector.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1390
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1391 For a bit vector to be a subset of another bit vector, both vectors must be of
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1392 the same size and the bit positions set in first vector must also be set in the
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1393 second bit vector.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1394
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1395 =item B<JacardSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1396
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1397 $Value = $FingerprintsBitVector->JacardSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1398 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1399 $Value = Fingerprints::FingerprintsBitVector::JacardSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1400 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1401
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1402 Returns value of I<Jacard> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1403
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1404 =item B<Kulczynski1SimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1405
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1406 $Value = $FingerprintsBitVector->Kulczynski1SimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1407 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1408 $Value = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1409 Kulczynski1SimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1410 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1411
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1412 Returns value of I<Kulczynski1> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1413
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1414 =item B<Kulczynski2SimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1415
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1416 $Value = $FingerprintsBitVector->Kulczynski2SimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1417 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1418 $Value = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1419 Kulczynski2SimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1420 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1421
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1422 Returns value of I<Kulczynski2> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1423
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1424 =item B<MatchingSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1425
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1426 $Value = $FingerprintsBitVector->MatchingSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1427 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1428 $Value = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1429 MatchingSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1430 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1431
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1432 Returns value of I<Matching> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1433
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1434 =item B<McConnaugheySimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1435
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1436 $Value = $FingerprintsBitVector->McConnaugheySimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1437 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1438 $Value = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1439 McConnaugheySimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1440 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1441
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1442 Returns value of I<McConnaughey> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1443
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1444 =item B<NewFromBinaryString>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1445
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1446 $NewFPBitVector = $FingerprintsBitVector->NewFromBinaryString(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1447 $BinaryString);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1448 $NewFPBitVector = Fingerprints::FingerprintsBitVector::NewFromBinaryString(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1449 $BinaryString);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1450
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1451 Creates a new I<FingerprintsBitVector> using I<BinaryString> and returns new
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1452 B<FingerprintsBitVector> object.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1453
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1454 =item B<NewFromHexadecimalString>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1455
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1456 $NewFPBitVector = $FingerprintsBitVector->NewFromHexadecimalString(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1457 $HexdecimalString);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1458 $NewFPBitVector = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1459 NewFromHexadecimalString(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1460 $HexdecimalString);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1461
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1462 Creates a new I<FingerprintsBitVector> using I<HexdecimalString> and returns new
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1463 B<FingerprintsBitVector> object.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1464
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1465 =item B<NewFromRawBinaryString>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1466
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1467 $NewFPBitVector = $FingerprintsBitVector->NewFromRawBinaryString(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1468 $RawBinaryString);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1469 $NewFPBitVector = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1470 NewFromRawBinaryString(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1471 $RawBinaryString);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1472
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1473 Creates a new I<FingerprintsBitVector> using I<RawBinaryString> and returns new
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1474 B<FingerprintsBitVector> object.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1475
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1476 =item B<OchiaiSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1477
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1478 $Value = $FingerprintsBitVector->OchiaiSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1479 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1480 $Value = Fingerprints::FingerprintsBitVector::OchiaiSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1481 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1482
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1483 Returns value of I<Ochiai> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1484
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1485 =item B<PearsonSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1486
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1487 $Value = $FingerprintsBitVector->PearsonSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1488 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1489 $Value = Fingerprints::FingerprintsBitVector::PearsonSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1490 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1491
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1492 Returns value of I<Pearson> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1493
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1494 =item B<RogersTanimotoSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1495
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1496 $Value = $FingerprintsBitVector->RogersTanimotoSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1497 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1498 $Value = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1499 RogersTanimotoSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1500 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1501
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1502 Returns value of I<RogersTanimoto> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1503
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1504 =item B<RussellRaoSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1505
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1506 $Value = $FingerprintsBitVector->RussellRaoSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1507 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1508 $Value = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1509 RussellRaoSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1510 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1511
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1512 Returns value of I<RussellRao> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1513
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1514 =item B<SetSpecifiedSize>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1515
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1516 $FingerprintsBitVector->SetSpecifiedSize($Size);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1517
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1518 Sets specified size for fingerprints bit vector.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1519
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1520 Irrespective of specified size, Perl functions used to handle bit data in B<BitVector> class
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1521 automatically set the size to the next nearest power of 2. I<SpecifiedSize> is used by
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1522 B<FingerprintsBitVector> class to process any arbitrary size during similarity coefficient calculations.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1523
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1524 =item B<SetDescription>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1525
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1526 $FingerprintsBitVector->SetDescription($Description);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1527
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1528 Sets I<Description> of fingerprints bit vector and returns I<FingerprintsBitVector>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1529
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1530 =item B<SetID>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1531
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1532 $FingerprintsBitVector->SetID($ID);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1533
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1534 Sets I<ID> of fingerprints bit vector and returns I<FingerprintsBitVector>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1535
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1536 =item B<SetVectorType>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1537
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1538 $FingerprintsBitVector->SetVectorType($VectorType);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1539
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1540 Sets I<VectorType> of fingerprints bit vector and returns I<FingerprintsBitVector>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1541
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1542 =item B<SimpsonSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1543
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1544 $Value = $FingerprintsBitVector->SimpsonSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1545 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1546 $Value = Fingerprints::FingerprintsBitVector::SimpsonSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1547 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1548
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1549 Returns value of I<Simpson> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1550
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1551 =item B<SkoalSneath1SimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1552
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1553 $Value = $FingerprintsBitVector->SkoalSneath1SimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1554 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1555 $Value = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1556 SkoalSneath1SimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1557 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1558
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1559 Returns value of I<SkoalSneath1> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1560
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1561 =item B<SkoalSneath2SimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1562
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1563 $Value = $FingerprintsBitVector->SkoalSneath2SimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1564 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1565 $Value = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1566 SkoalSneath2SimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1567 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1568
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1569 Returns value of I<SkoalSneath2> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1570
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1571 =item B<SkoalSneath3SimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1572
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1573 $Value = $FingerprintsBitVector->SkoalSneath3SimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1574 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1575 $Value = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1576 SkoalSneath3SimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1577 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1578
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1579 Returns value of I<SkoalSneath3> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1580
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1581 =item B<StringifyFingerprintsBitVector>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1582
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1583 $String = $FingerprintsBitVector->StringifyFingerprintsBitVector();
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1584
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1585 Returns a string containing information about I<FingerprintsBitVector> object.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1586
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1587 =item B<TanimotoSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1588
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1589 $Value = $FingerprintsBitVector->TanimotoSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1590 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1591 $Value = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1592 TanimotoSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1593 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1594
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1595 Returns value of I<Tanimoto> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1596
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1597 =item B<TverskySimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1598
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1599 $Value = $FingerprintsBitVector->TverskySimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1600 $OtherFingerprintBitVector, $Alpha);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1601 $Value = Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1602 TverskySimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1603 $FingerprintsBitVectorA, $FingerprintBitVectorB, $Alpha);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1604
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1605 Returns value of I<Tversky> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1606
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1607 =item B<WeightedTanimotoSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1608
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1609 $Value =
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1610 $FingerprintsBitVector->WeightedTanimotoSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1611 $OtherFingerprintBitVector, $Beta);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1612 $Value =
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1613 Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1614 WeightedTanimotoSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1615 $FingerprintsBitVectorA, $FingerprintBitVectorB, $Beta);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1616
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1617 Returns value of I<WeightedTanimoto> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1618
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1619 =item B<WeightedTverskySimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1620
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1621 $Value =
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1622 $FingerprintsBitVector->WeightedTverskySimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1623 $OtherFingerprintBitVector, $Alpha, $Beta);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1624 $Value =
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1625 Fingerprints::FingerprintsBitVector::
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1626 WeightedTverskySimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1627 $FingerprintsBitVectorA, $FingerprintBitVectorB, $Alpha, $Beta);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1628
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1629 Returns value of I<WeightedTversky> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1630
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1631 =item B<YuleSimilarityCoefficient>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1632
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1633 $Value = $FingerprintsBitVector->YuleSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1634 $OtherFingerprintBitVector);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1635 $Value = Fingerprints::FingerprintsBitVector::YuleSimilarityCoefficient(
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1636 $FingerprintsBitVectorA, $FingerprintBitVectorB);
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1637
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1638 Returns value of I<Yule> similarity coefficient between two same size I<FingerprintsBitVectors>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1639
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1640 =back
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1641
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1642 =head1 AUTHOR
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1643
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1644 Manish Sud <msud@san.rr.com>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1645
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1646 =head1 SEE ALSO
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1647
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1648 BitVector.pm, FingerprintsStringUtil.pm, FingerprintsVector.pm, Vector.pm
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1649
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1650 =head1 COPYRIGHT
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1651
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1652 Copyright (C) 2015 Manish Sud. All rights reserved.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1653
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1654 This file is part of MayaChemTools.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1655
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1656 MayaChemTools is free software; you can redistribute it and/or modify it under
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1657 the terms of the GNU Lesser General Public License as published by the Free
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1658 Software Foundation; either version 3 of the License, or (at your option)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1659 any later version.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1660
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1661 =cut