annotate mayachemtools/bin/InfoFingerprintsFiles.pl @ 0:73ae111cf86f draft

Uploaded
author deepakjadmin
date Wed, 20 Jan 2016 11:55:01 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1 #!/usr/bin/perl -w
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
2 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
3 # $RCSfile: InfoFingerprintsFiles.pl,v $
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
4 # $Date: 2015/02/28 20:46:20 $
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
5 # $Revision: 1.20 $
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
6 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
7 # Author: Manish Sud <msud@san.rr.com>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
8 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
9 # Copyright (C) 2015 Manish Sud. All rights reserved.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
10 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
11 # This file is part of MayaChemTools.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
12 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
13 # MayaChemTools is free software; you can redistribute it and/or modify it under
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
14 # the terms of the GNU Lesser General Public License as published by the Free
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
15 # Software Foundation; either version 3 of the License, or (at your option) any
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
16 # later version.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
17 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
18 # MayaChemTools is distributed in the hope that it will be useful, but without
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
19 # any warranty; without even the implied warranty of merchantability of fitness
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
20 # for a particular purpose. See the GNU Lesser General Public License for more
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
21 # details.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
22 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
23 # You should have received a copy of the GNU Lesser General Public License
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
24 # along with MayaChemTools; if not, see <http://www.gnu.org/licenses/> or
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
25 # write to the Free Software Foundation Inc., 59 Temple Place, Suite 330,
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
26 # Boston, MA, 02111-1307, USA.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
27 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
28
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
29 use strict;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
30 use FindBin; use lib "$FindBin::Bin/../lib";
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
31 use Getopt::Long;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
32 use File::Basename;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
33 use Text::ParseWords;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
34 use Benchmark;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
35 use FileUtil;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
36 use TextUtil;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
37 use Fingerprints::FingerprintsFileUtil;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
38 use Fingerprints::FingerprintsStringUtil;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
39
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
# File-scoped state. These lexicals are declared at file scope so that the
# subroutines defined later in this file can read them directly.
# NOTE(review): %Options is presumably filled in by SetupScriptUsage() - confirm.
my($ScriptName, %Options, $StartTime, $EndTime, $TotalTime);

# Autoflush STDOUT
$| = 1;

# Starting message...
$ScriptName = basename($0);
print "\n$ScriptName: Starting...\n\n";
# Direct method call instead of the indirect-object form "new Benchmark".
$StartTime = Benchmark->new;

# Get the options and setup script...
SetupScriptUsage();
if ($Options{help} || @ARGV < 1) {
  die GetUsageFromPod("$FindBin::Bin/$ScriptName");
}

# Expand command line arguments into the list of fingerprints files...
my @FingerprintsFilesList = ExpandFileNames(\@ARGV, "sdf sd fpf fp csv tsv");

# Process options...
print "Processing options...\n";
my(%OptionsInfo);
ProcessOptions();

# Setup information about input files...
print "Checking input fingerprints file(s)...\n";
my(%FingerprintsFilesInfo);
RetrieveFingerprintsFilesInfo();

# Process input files, skipping any file not flagged as okay...
my($FileIndex);
if (@FingerprintsFilesList > 1) {
  print "\nProcessing fingerprints files...\n";
}
for $FileIndex (0 .. $#FingerprintsFilesList) {
  if ($FingerprintsFilesInfo{FileOkay}[$FileIndex]) {
    print "\nProcessing file $FingerprintsFilesList[$FileIndex]...\n";
    ListFingerprintsFileInfo($FileIndex);
  }
}
ListTotalSizeOfFiles();

print "\n$ScriptName:Done...\n\n";

# Report elapsed time...
$EndTime = Benchmark->new;
$TotalTime = timediff($EndTime, $StartTime);
print "Total time: ", timestr($TotalTime), "\n";
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
87
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
88 ###############################################################################
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
89
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
# List appropriate information for one fingerprints file...
#
# $FileIndex selects the entry in %FingerprintsFilesInfo. The file is read
# entry by entry; each entry is counted as missing (when the file level
# validity check failed), invalid, or valid, and valid entries are further
# counted as bit-vector or vector fingerprints. A summary is printed at the end,
# followed by file size and modification time.
#
sub ListFingerprintsFileInfo {
  my($FileIndex) = @_;

  my $FileType = $FingerprintsFilesInfo{FileType}[$FileIndex];
  my $IsSDFile = ($FileType =~ /^SD$/i) ? 1 : 0;
  my $DataEntryLabel = $IsSDFile ? 'compounds' : 'lines';

  # Counters and accumulators...
  my $DataEntryCount = 0;
  my $ValidDataEntryCount = 0;
  my $InvalidDataEntryCount = 0;
  my $MissingDataEntryCount = 0;
  my $BitVectorDataEntryCount = 0;
  my $VectorDataEntryCount = 0;
  my $TotalBitDensity = 0;

  my $IOParametersRef = $FingerprintsFilesInfo{FingerprintsFileIOParameters}[$FileIndex];
  my $FingerprintsFileIO = Fingerprints::FingerprintsFileUtil::NewFingerprintsFileIO(%{$IOParametersRef});
  $FingerprintsFileIO->Open();

  # File level validity is checked once, before any entry is read...
  my $FileDataIsInvalid = !$FingerprintsFileIO->IsFingerprintsFileDataValid();

  FINGERPRINTS: while ($FingerprintsFileIO->Read()) {
    $DataEntryCount++;

    # Missing data...
    if ($FileDataIsInvalid) {
      $MissingDataEntryCount++;
      ListEmptyOrInvalidFingerprintsDataInfo('EmptyData', $FingerprintsFileIO, $FileType)
        if ($OptionsInfo{ValidateData} || $OptionsInfo{CountEmptyFingerprints});
      next FINGERPRINTS;
    }

    # Invalid data...
    unless ($FingerprintsFileIO->IsFingerprintsDataValid()) {
      $InvalidDataEntryCount++;
      ListEmptyOrInvalidFingerprintsDataInfo('InvalidData', $FingerprintsFileIO, $FileType)
        if $OptionsInfo{ValidateData};
      next FINGERPRINTS;
    }
    $ValidDataEntryCount++;

    my $FingerprintsObject = $FingerprintsFileIO->GetFingerprints();
    my $FingerprintsType = $FingerprintsObject->GetVectorType();

    if ($FingerprintsType =~ /^FingerprintsBitVector$/i) {
      $BitVectorDataEntryCount++;
      $TotalBitDensity += $FingerprintsObject->GetFingerprintsBitDensity()
        if $OptionsInfo{ListAverageBitDensity};
    }
    elsif ($FingerprintsType =~ /^FingerprintsVector$/i) {
      $VectorDataEntryCount++;
    }

    ListFingerprintsDataEntryInfo($FingerprintsFileIO, $FileType)
      if $OptionsInfo{ListFingerprintsDataEntryInfo};
  }
  $FingerprintsFileIO->Close();

  # Summary...
  print "\nFingerprints file type: $FileType\n";
  print $IsSDFile ? "Number of compounds: $DataEntryCount\n" : "Number of data lines: $DataEntryCount\n";

  ListFileTypeHeaderInfo($FingerprintsFileIO, $FileType);

  print "\nNumber of $DataEntryLabel with valid fingerprints string data: $ValidDataEntryCount\n";
  print "Number of $DataEntryLabel with bit-vector fingerprints string data: $BitVectorDataEntryCount\n";
  print "Number of $DataEntryLabel with vector fingerprints string data: $VectorDataEntryCount\n";

  if ($OptionsInfo{CountEmptyFingerprints}) {
    print "Number of $DataEntryLabel with missing fingerprints data: $MissingDataEntryCount\n";
    print "Number of $DataEntryLabel with invalid fingerprints data: $InvalidDataEntryCount\n";
  }

  # Average is reported only when at least one bit-vector entry was seen...
  if ($OptionsInfo{ListAverageBitDensity} && $BitVectorDataEntryCount) {
    my $AverageBitDensity = sprintf("%.2f", $TotalBitDensity/$BitVectorDataEntryCount) + 0;
    print "\nAverage bit density: $AverageBitDensity\n";
  }

  # File size and modification information...
  print "\nFile size: ", FormatFileSize($FingerprintsFilesInfo{FileSize}[$FileIndex]), " \n";
  print "Last modified: ", $FingerprintsFilesInfo{FileLastModified}[$FileIndex], " \n";
}
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
180
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
# List empty or invalid fingerprints file data information...
#
# $Mode is 'EmptyData' for entries without fingerprints data; any other value
# is reported as invalid data. Output depends on $OptionsInfo{DetailLevel}:
# 3 or more also prints the offending compound string or data line, 1 or 2
# prints only its number, and anything lower prints nothing.
#
sub ListEmptyOrInvalidFingerprintsDataInfo {
  my($Mode, $FingerprintsFileIO, $FileType) = @_;

  my $ModeInfo = "invalid";
  $ModeInfo = "no" if $Mode =~ /^EmptyData$/i;

  my $DetailLevel = $OptionsInfo{DetailLevel};

  if ($FileType =~ /^SD$/i) {
    # SD files are reported by compound number...
    my $CmpdNum = $FingerprintsFileIO->GetCompoundNum();
    if ($DetailLevel >= 3) {
      my $CmpdString = $FingerprintsFileIO->GetCompoundString();
      print "Compound number $CmpdNum contains $ModeInfo fingerprints data: $CmpdString \n";
    }
    elsif ($DetailLevel >= 1) {
      print "Compound number $CmpdNum contains $ModeInfo fingerprints data...\n";
    }
  }
  else {
    # All other file types are reported by data line number...
    my $LineNum = $FingerprintsFileIO->GetLineNum();
    if ($DetailLevel >= 3) {
      my $DataLine = $FingerprintsFileIO->GetDataLine();
      print "Data line number $LineNum contains $ModeInfo fingerprints data: $DataLine \n";
    }
    elsif ($DetailLevel >= 1) {
      print "Data line number $LineNum contains $ModeInfo fingerprints data...\n";
    }
  }
}
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
214
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
# List detailed information about fingerprints data entry...
#
# Prints a single line for the current entry of $FingerprintsFileIO: the
# compound or data line number, followed by "; Label: value" fields selected
# by the List* flags in %OptionsInfo.
#
sub ListFingerprintsDataEntryInfo {
  my($FingerprintsFileIO, $FileType) = @_;
  my($FingerprintsDescription, $FingerprintsSize, $FingerprintsBitStringFormat, $FingerprintsBitOrder, $BitDensity, $NumOfOnBits, $FingerprintsVectorValuesType, $FingerprintsVectorValuesFormat, $NumOfNonZeroValues);

  my $FingerprintsObject = $FingerprintsFileIO->GetFingerprints();
  my $FingerprintsString = $FingerprintsFileIO->GetFingerprintsString();

  # Initial type comes from the object; it is overwritten below with the type
  # parsed out of the fingerprints string, and that parsed value drives the
  # output section...
  my $FingerprintsType = $FingerprintsObject->GetVectorType();

  if ($FingerprintsType =~ /^FingerprintsBitVector$/i) {
    ($FingerprintsType, $FingerprintsDescription, $FingerprintsSize, $FingerprintsBitStringFormat, $FingerprintsBitOrder) = Fingerprints::FingerprintsStringUtil::GetFingerprintsStringValues($FingerprintsString);

    # Computed only on request; empty string otherwise...
    $BitDensity = $OptionsInfo{ListBitDensity} ? $FingerprintsObject->GetFingerprintsBitDensity() : '';
    $NumOfOnBits = $OptionsInfo{ListNumOfOnBits} ? $FingerprintsObject->GetNumOfSetBits() : '';
  }
  elsif ($FingerprintsType =~ /^FingerprintsVector$/i) {
    ($FingerprintsType, $FingerprintsDescription, $FingerprintsSize, $FingerprintsVectorValuesType, $FingerprintsVectorValuesFormat) = Fingerprints::FingerprintsStringUtil::GetFingerprintsStringValues($FingerprintsString);

    $NumOfNonZeroValues = '';
    if ($OptionsInfo{ListNumOfNonZeroValues}) {
      # Alphanumerical values are reported as 'NA' instead of a count...
      $NumOfNonZeroValues = ($FingerprintsVectorValuesType =~ /^AlphaNumericalValues$/i)
        ? 'NA'
        : $FingerprintsObject->GetNumOfNonZeroValues();
    }
  }

  # Entry identifier...
  print(($FileType =~ /^SD$/i)
    ? "Compound number: " . $FingerprintsFileIO->GetCompoundNum()
    : "Data line number: " . $FingerprintsFileIO->GetLineNum());

  # Fields common to both fingerprints types...
  print "; FPType: $FingerprintsType" if $OptionsInfo{ListFingerprintsType};
  print "; FPDescription: $FingerprintsDescription" if $OptionsInfo{ListFingerprintsDescription};
  print "; FPSize: $FingerprintsSize" if $OptionsInfo{ListFingerprintsSize};

  # Type specific fields...
  if ($FingerprintsType =~ /^FingerprintsBitVector$/i) {
    print "; FPBitStringFormat: $FingerprintsBitStringFormat" if $OptionsInfo{ListFingerprintsBitStringFormat};
    print "; FPBitOrder: $FingerprintsBitOrder" if $OptionsInfo{ListFingerprintsBitOrder};
    print "; BitDensity: $BitDensity" if $OptionsInfo{ListBitDensity};
    print "; NumOfOnBits: $NumOfOnBits" if $OptionsInfo{ListNumOfOnBits};
  }
  elsif ($FingerprintsType =~ /^FingerprintsVector$/i) {
    print "; FPVectorValuesType: $FingerprintsVectorValuesType" if $OptionsInfo{ListFingerprintsVectorValuesType};
    print "; FPVectorValuesFormat: $FingerprintsVectorValuesFormat" if $OptionsInfo{ListFingerprintsVectorValuesFormat};
    print "; NumOfNonZeroValues: $NumOfNonZeroValues" if $OptionsInfo{ListNumOfNonZeroValues};
  }
  print "\n";
}
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
300
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
# List file type header information...
#
# For file type 'Text', prints the number of columns and the column labels.
# For file type 'FP', prints each header data key and its value as "# key = value"
# lines. Nothing is printed for any other file type.
#
sub ListFileTypeHeaderInfo {
  my($FingerprintsFileIO, $FileType) = @_;

  if ($FileType =~ /^Text$/i) {
    my @DataColLabels = $FingerprintsFileIO->GetDataColLabels();
    my $NumOfCols = @DataColLabels;

    print "Number of columns: " . $NumOfCols . "\n";
    print "Column labels: ", JoinWords(\@DataColLabels, ", ", 1), "\n";
  }
  elsif ($FileType =~ /^FP$/i) {
    my %HeaderDataKeysAndValues = $FingerprintsFileIO->GetHeaderDataKeysAndValues();

    print "\nFP file header data keys and values: \n#\n";
    # Keys are listed in the order returned by GetHeaderDataKeys()...
    for my $Key ($FingerprintsFileIO->GetHeaderDataKeys()) {
      my $Value = $HeaderDataKeysAndValues{$Key};
      print "# $Key = $Value\n";
    }
    print "#\n";
  }
}
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
323
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
# Total size of all the files...
#
# Adds up $FingerprintsFilesInfo{FileSize} over the files flagged as okay and
# prints the total, but only when more than one file is okay. Takes no
# arguments; reads the file-scoped @FingerprintsFilesList and
# %FingerprintsFilesInfo.
#
sub ListTotalSizeOfFiles {
  my($FileOkayCount, $TotalSize, $Index);

  $FileOkayCount = 0;
  $TotalSize = 0;

  for $Index (0 .. $#FingerprintsFilesList) {
    # Test the FileOkay flag, the same gate the main processing loop uses.
    # Testing the file name itself is true for practically every entry and
    # would count files that were skipped as not okay.
    if ($FingerprintsFilesInfo{FileOkay}[$Index]) {
      $FileOkayCount++;
      $TotalSize += $FingerprintsFilesInfo{FileSize}[$Index];
    }
  }
  if ($FileOkayCount > 1) {
    print "\nTotal size of $FileOkayCount files: ", FormatFileSize($TotalSize), "\n";
  }
}
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
341
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
# Collect per-file information for every name in the fingerprints files list...
#
# For each entry in @FingerprintsFilesList, the corresponding slots in
# %FingerprintsFilesInfo are first reset to "not okay" defaults. A file is then
# skipped with a warning when it doesn't exist, when no fingerprints file type
# is returned for it, or when that type is not SD, FP or Text. For the remaining
# files, the file type, size, last modified string, input delimiter and the
# parameters for FingerprintsFileIO are recorded and the file is marked okay.
#
sub RetrieveFingerprintsFilesInfo {
  my($Index, $FileSpec, $Type, $Dir, $BaseName, $Ext, $Delim, $TimeString, $DateString, $InfoKey, %IOParameters);

  # Start from a clean slate with one empty list per kind of information...
  %FingerprintsFilesInfo = ();
  for $InfoKey (qw(FileOkay FileType FileSize FileLastModified InDelim FingerprintsFileIOParameters)) {
    $FingerprintsFilesInfo{$InfoKey} = [];
  }

  FILELIST: for $Index (0 .. $#FingerprintsFilesList) {
    $FileSpec = $FingerprintsFilesList[$Index];

    # Defaults which stay in place for any file skipped below...
    $FingerprintsFilesInfo{FileOkay}[$Index] = 0;
    $FingerprintsFilesInfo{FileType}[$Index] = '';
    $FingerprintsFilesInfo{FileSize}[$Index] = 0;
    $FingerprintsFilesInfo{FileLastModified}[$Index] = '';
    $FingerprintsFilesInfo{InDelim}[$Index] = "";
    $FingerprintsFilesInfo{FingerprintsFileIOParameters}[$Index] = {};

    unless (-e $FileSpec) {
      warn "Warning: Ignoring file $FileSpec: It doesn't exist\n";
      next FILELIST;
    }

    $Type = Fingerprints::FingerprintsFileUtil::GetFingerprintsFileType($FileSpec);
    if (IsEmpty($Type)) {
      warn "Warning: Ignoring file $FileSpec: It's not a fingerprints file\n";
      next FILELIST;
    }

    # A tsv extension overrides the delimiter specified on the command line...
    ($Dir, $BaseName, $Ext) = ParseFileName($FileSpec);
    $Delim = ($Ext =~ /^tsv$/i) ? 'Tab' : $OptionsInfo{InDelim};

    # Setup FingerprintsFileIO parameters: a common set for all file types
    # along with the type specific additions...
    %IOParameters = ('Name' => $FileSpec, 'Mode' => 'Read', 'ValidateData' => $OptionsInfo{ValidateData}, 'DetailLevel' => 1);
    if ($Type =~ /^SD$/i) {
      $IOParameters{'FingerprintsFieldLabel'} = $OptionsInfo{FingerprintsFieldLabel};
    }
    elsif ($Type =~ /^FP$/i) {
      # FP files don't need anything beyond the common parameters...
    }
    elsif ($Type =~ /^Text$/i) {
      # NOTE(review): the delimiter specified by the user is passed here and not
      # the 'Tab' override calculated above; presumably tsv files are handled
      # during file IO itself - confirm.
      @IOParameters{'FingerprintsCol', 'ColMode', 'InDelim'} = @OptionsInfo{'FingerprintsCol', 'ColMode', 'InDelim'};
    }
    else {
      warn "Warning: File type for fingerprints file, $FileSpec, is not valid. Supported file types: SD, FP or Text\n";
      next FILELIST;
    }

    # File made it through all the checks; record its information...
    $FingerprintsFilesInfo{FileOkay}[$Index] = 1;
    $FingerprintsFilesInfo{FileType}[$Index] = $Type;

    $FingerprintsFilesInfo{FileSize}[$Index] = FileSize($FileSpec);
    ($TimeString, $DateString) = FormattedFileModificationTimeAndDate($FileSpec);
    $FingerprintsFilesInfo{FileLastModified}[$Index] = "$TimeString; $DateString";

    $FingerprintsFilesInfo{InDelim}[$Index] = $Delim;

    # Keep a copy so the parameters don't change on the next pass...
    $FingerprintsFilesInfo{FingerprintsFileIOParameters}[$Index] = { %IOParameters };
  }
}
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
415
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
# Convert raw command line option values into the settings used by the script...
#
# Reads %Options and rebuilds %OptionsInfo from scratch. Each listing flag is
# set to 1 when either the "all" option or its own option is specified and to 0
# otherwise. Listing of average bit density turns on listing of bit density as
# well. The fingerprints column and field label default to 'AutoDetect' when no
# value is specified.
#
# Dies when the fingerprints column value is not a positive integer during
# ColNum column mode.
#
sub ProcessOptions {
  my($IsRequested, $ColSpec, $FieldSpec, @DataEntryInfoKeys);

  %OptionsInfo = ();

  # Returns 1 when the named option or the "all" option is specified, 0 otherwise...
  $IsRequested = sub {
    my($OptionName) = @_;
    return ($Options{all} || $Options{$OptionName}) ? 1 : 0;
  };

  # Asking for average bit density implies listing of bit density as well...
  $OptionsInfo{ListAverageBitDensity} = $IsRequested->('averagebitdensity');
  $OptionsInfo{ListBitDensity} = $OptionsInfo{ListAverageBitDensity} ? 1 : $IsRequested->('bitdensity');

  # Rows containing fingerprints data are always counted...
  $OptionsInfo{CountFingerprints} = 1;
  $OptionsInfo{CountEmptyFingerprints} = $IsRequested->('empty');

  $OptionsInfo{ColMode} = $Options{colmode};

  $ColSpec = $Options{fingerprintscol};
  if (IsNotEmpty($ColSpec)) {
    if ($Options{colmode} =~ /^ColNum$/i && !IsPositiveInteger($ColSpec)) {
      die "Error: Column value, $ColSpec, specified using \"--FingerprintsCol\" is not valid: Allowed integer values: > 0.\n";
    }
    $OptionsInfo{FingerprintsCol} = $ColSpec;
  }
  else {
    $OptionsInfo{FingerprintsCol} = 'AutoDetect';
  }

  $FieldSpec = $Options{fingerprintsfield};
  $OptionsInfo{FingerprintsFieldLabel} = IsNotEmpty($FieldSpec) ? $FieldSpec : 'AutoDetect';

  $OptionsInfo{ValidateData} = $IsRequested->('datacheck');
  $OptionsInfo{DetailLevel} = $Options{detail};

  $OptionsInfo{ListFingerprintsType} = $IsRequested->('fingerprintstype');
  $OptionsInfo{ListFingerprintsDescription} = $IsRequested->('fingerprintsdescription');
  $OptionsInfo{ListFingerprintsSize} = $IsRequested->('fingerprintssize');

  $OptionsInfo{ListFingerprintsBitStringFormat} = $IsRequested->('fingerprintsbitstringformat');
  $OptionsInfo{ListFingerprintsBitOrder} = $IsRequested->('fingerprintsbitorder');

  $OptionsInfo{ListFingerprintsVectorValuesType} = $IsRequested->('fingerprintsvectorvaluestype');
  $OptionsInfo{ListFingerprintsVectorValuesFormat} = $IsRequested->('fingerprintsvectorvaluesformat');

  $OptionsInfo{InDelim} = $Options{indelim};

  $OptionsInfo{ListNumOfOnBits} = $IsRequested->('numofonbits');
  $OptionsInfo{ListNumOfNonZeroValues} = $IsRequested->('numofnonzerovalues');

  # Set when any one of the flags listed below is on...
  @DataEntryInfoKeys = qw(
    ListFingerprintsType ListFingerprintsDescription ListFingerprintsSize
    ListFingerprintsBitStringFormat ListFingerprintsBitOrder
    ListFingerprintsVectorValuesType ListFingerprintsVectorValuesFormat
    ListBitDensity ListAverageBitDensity ListNumOfOnBits ListNumOfNonZeroValues
  );
  $OptionsInfo{ListFingerprintsDataEntryInfo} = scalar(grep { $OptionsInfo{$_} } @DataEntryInfoKeys) ? 1 : 0;

}
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
473
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
# Retrieve command line options and validate the values specified for them...
#
# Resets %Options to the default values for colmode, detail and indelim, lets
# GetOptions fill in whatever is specified on the command line, changes to the
# working directory when one is specified, and checks the values of colmode,
# detail and indelim.
#
# Dies with an error message when option parsing fails, the working directory
# is not a directory or can't be entered, or any of the checked values is
# not valid.
#
sub SetupScriptUsage {
  my($WorkingDir, @OptionSpecs);

  # Default values for options which take an argument...
  %Options = (colmode => 'colnum', detail => 1, indelim => 'comma');

  @OptionSpecs = (
    "all|a", "averagebitdensity", "bitdensity", "count", "colmode|c=s", "detail|d=i",
    "datacheck", "empty|e", "fingerprintsfield=s", "fingerprintscol=s", "fingerprintstype",
    "fingerprintsdescription", "fingerprintssize", "fingerprintsbitstringformat",
    "fingerprintsbitorder", "fingerprintsvectorvaluestype", "fingerprintsvectorvaluesformat",
    "help|h", "indelim=s", "numofonbits", "numofnonzerovalues", "workingdir|w=s",
  );
  GetOptions(\%Options, @OptionSpecs)
    or die "\nTo get a list of valid options and their values, use \"$ScriptName -h\" or\n\"perl -S $ScriptName -h\" command and try again...\n";

  # Switch to the working directory before validating the rest of the options...
  $WorkingDir = $Options{workingdir};
  if ($WorkingDir) {
    unless (-d $WorkingDir) {
      die "Error: The value specified, $WorkingDir, for option \"-w --workingdir\" is not a directory name.\n";
    }
    chdir $WorkingDir or die "Error: Couldn't chdir $WorkingDir: $! \n";
  }

  unless ($Options{colmode} =~ /^(ColNum|ColLabel)$/i) {
    die "Error: The value specified, $Options{colmode}, for option \"-c, --ColMode\" is not valid. Allowed values: ColNum, or ColLabel\n";
  }
  unless (IsPositiveInteger($Options{detail})) {
    die "Error: The value specified, $Options{detail}, for option \"-d, --detail\" is not valid. Allowed values: > 0 \n";
  }
  unless ($Options{indelim} =~ /^(comma|semicolon)$/i) {
    die "Error: The value specified, $Options{indelim}, for option \"--InDelim\" is not valid. Allowed values: comma, or semicolon\n";
  }
}
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
503
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
504 __END__
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
505
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
506 =head1 NAME
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
507
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
508 InfoFingerprintsFiles.pl - List information about fingerprints data in SD, FP and CSV/TSV text file(s)
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
509
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
510 =head1 SYNOPSIS
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
511
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
512 InfoFingerprintsFiles.pl SDFile(s) FPFile(s) TextFile(s)...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
513
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
514 InfoFingerprintsFiles.pl [B<-a, --all>] [B<--AverageBitDensity>] [B<--BitDensity>]
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
515 [B<--count>] [B<-c, --ColMode> I<ColNum | ColLabel>] [B<--DataCheck>]
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
516 [B<-d, --detail> I<InfoLevel>] [B<-e, --empty>] [B<--FingerprintsCol> I<col number | col name>]
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
517 [B<--FingerprintsField> I<FieldLabel>] [B<--FingerprintsType>] [B<--FingerprintsDescription>]
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
518 [B<--FingerprintsSize>] [B<--FingerprintsBitStringFormat>] [B<--FingerprintsBitOrder>]
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
519 [B<--FingerprintsVectorValuesType>] [B<--FingerprintsVectorValuesFormat>]
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
520 [B<-h, --help>] [B<--InDelim> I<comma | semicolon>]
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
521 [B<--NumOfOnBits>] [B<--NumOfNonZeroValues>]
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
522 [B<-w, --WorkingDir> dirname] SDFile(s) FPFile(s) TextFile(s)...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
523
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
524 =head1 DESCRIPTION
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
525
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
526 List information about fingerprints data in I<SD, FP and CSV/TSV> text file(s): number of
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
527 rows containing fingerprints data, type of fingerprints vector, description and size of fingerprints,
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
528 bit density and average bit density for bit-vector fingerprints strings, and so on.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
529
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
530 The scripts InfoFingerprintsSDFiles.pl and InfoFingerprintsTextFiles.pl have been removed from the
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
531 current release of MayaChemTools and their functionality merged with this script.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
532
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
533 The valid I<SDFile> extensions are I<.sdf> and I<.sd>. All SD files in the current directory
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
534 can be specified either by I<*.sdf> or the current directory name.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
535
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
536 The valid I<FPFile> extensions are I<.fpf> and I<.fp>. All FP files in the current directory
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
537 can be specified either by I<*.fpf> or the current directory name.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
538
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
539 The valid I<TextFile> extensions are I<.csv> and I<.tsv> for comma/semicolon and tab
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
540 delimited text files respectively. All other file names are ignored. All text files in the
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
541 current directory can be specified by I<*.csv>, I<*.tsv>, or the current directory
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
542 name. The B<--indelim> option determines the format of I<TextFile(s)>. Any file
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
543 which doesn't correspond to the format indicated by B<--indelim> option is ignored.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
544
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
545 Format of fingerprint strings data in I<SDFile(s), FPFile(s) and TextFile(s)> is automatically
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
546 detected.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
547
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
548 Example of I<FP> file containing fingerprints bit-vector string data:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
549
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
550 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
551 # Package = MayaChemTools 7.4
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
552 # ReleaseDate = Oct 21, 2010
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
553 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
554 # TimeStamp = Mon Mar 7 15:14:01 2011
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
555 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
556 # FingerprintsStringType = FingerprintsBitVector
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
557 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
558 # Description = PathLengthBits:AtomicInvariantsAtomTypes:MinLength1:...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
559 # Size = 1024
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
560 # BitStringFormat = HexadecimalString
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
561 # BitsOrder = Ascending
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
562 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
563 Cmpd1 9c8460989ec8a49913991a6603130b0a19e8051c89184414953800cc21510...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
564 Cmpd2 000000249400840040100042011001001980410c000000001010088001120...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
565 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
566 ... ..
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
567
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
568 Example of I<FP> file containing fingerprints vector string data:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
569
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
570 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
571 # Package = MayaChemTools 7.4
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
572 # ReleaseDate = Oct 21, 2010
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
573 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
574 # TimeStamp = Mon Mar 7 15:14:01 2011
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
575 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
576 # FingerprintsStringType = FingerprintsVector
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
577 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
578 # Description = PathLengthBits:AtomicInvariantsAtomTypes:MinLength1:...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
579 # VectorStringFormat = IDsAndValuesString
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
580 # VectorValuesType = NumericalValues
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
581 #
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
582 Cmpd1 338;C F N O C:C C:N C=O CC CF CN CO C:C:C C:C:N C:CC C:CF C:CN C:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
583 N:C C:NC CC:N CC=O CCC CCN CCO CNC NC=O O=CO C:C:C:C C:C:C:N C:C:CC...;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
584 33 1 2 5 21 2 2 12 1 3 3 20 2 10 2 2 1 2 2 2 8 2 5 1 1 1 19 2 8 2 2 2 2
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
585 6 2 2 2 2 2 2 2 2 3 2 2 1 4 1 5 1 1 18 6 2 2 1 2 10 2 1 2 1 2 2 2 2 ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
586 Cmpd2 103;C N O C=N C=O CC CN CO CC=O CCC CCN CCO CNC N=CN NC=O NCN O=C
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
587 O C CC=O CCCC CCCN CCCO CCNC CNC=N CNC=O CNCN CCCC=O CCCCC CCCCN CC...;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
588 15 4 4 1 2 13 5 2 2 15 5 3 2 2 1 1 1 2 17 7 6 5 1 1 1 2 15 8 5 7 2 2 2 2
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
589 1 2 1 1 3 15 7 6 8 3 4 4 3 2 2 1 2 3 14 2 4 7 4 4 4 4 1 1 1 2 1 1 1 ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
590 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
591 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
592
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
593 Example of I<SD> file containing fingerprints bit-vector string data:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
594
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
595 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
596 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
597 $$$$
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
598 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
599 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
600 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
601 41 44 0 0 0 0 0 0 0 0999 V2000
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
602 -3.3652 1.4499 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
603 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
604 2 3 1 0 0 0 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
605 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
606 M END
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
607 > <CmpdID>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
608 Cmpd1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
609
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
610 > <PathLengthFingerprints>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
611 FingerprintsBitVector;PathLengthBits:AtomicInvariantsAtomTypes:MinLengt
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
612 h1:MaxLength8;1024;HexadecimalString;Ascending;9c8460989ec8a49913991a66
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
613 03130b0a19e8051c89184414953800cc2151082844a201042800130860308e8204d4028
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
614 00831048940e44281c00060449a5000ac80c894114e006321264401600846c050164462
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
615 08190410805000304a10205b0100e04c0038ba0fad0209c0ca8b1200012268b61c0026a
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
616 aa0660a11014a011d46
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
617
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
618 $$$$
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
619 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
620 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
621
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
622 Example of CSV I<Text> file containing fingerprints bit-vector string data:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
623
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
624 "CompoundID","PathLengthFingerprints"
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
625 "Cmpd1","FingerprintsBitVector;PathLengthBits:AtomicInvariantsAtomTypes
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
626 :MinLength1:MaxLength8;1024;HexadecimalString;Ascending;9c8460989ec8a4
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
627 9913991a6603130b0a19e8051c89184414953800cc2151082844a20104280013086030
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
628 8e8204d402800831048940e44281c00060449a5000ac80c894114e006321264401..."
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
629 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
630 ... ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
631
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
632 The current release of MayaChemTools supports the following types of fingerprint
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
633 bit-vector and vector strings:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
634
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
635 FingerprintsVector;AtomNeighborhoods:AtomicInvariantsAtomTypes:MinRadi
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
636 us0:MaxRadius2;41;AlphaNumericalValues;ValuesString;NR0-C.X1.BO1.H3-AT
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
637 C1:NR1-C.X3.BO3.H1-ATC1:NR2-C.X1.BO1.H3-ATC1:NR2-C.X3.BO4-ATC1 NR0-C.X
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
638 1.BO1.H3-ATC1:NR1-C.X3.BO3.H1-ATC1:NR2-C.X1.BO1.H3-ATC1:NR2-C.X3.BO4-A
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
639 TC1 NR0-C.X2.BO2.H2-ATC1:NR1-C.X2.BO2.H2-ATC1:NR1-C.X3.BO3.H1-ATC1:NR2
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
640 -C.X2.BO2.H2-ATC1:NR2-N.X3.BO3-ATC1:NR2-O.X1.BO1.H1-ATC1 NR0-C.X2.B...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
641
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
642 FingerprintsVector;AtomTypesCount:AtomicInvariantsAtomTypes:ArbitraryS
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
643 ize;10;NumericalValues;IDsAndValuesString;C.X1.BO1.H3 C.X2.BO2.H2 C.X2
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
644 .BO3.H1 C.X3.BO3.H1 C.X3.BO4 F.X1.BO1 N.X2.BO2.H1 N.X3.BO3 O.X1.BO1.H1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
645 O.X1.BO2;2 4 14 3 10 1 1 1 3 2
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
646
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
647 FingerprintsVector;AtomTypesCount:SLogPAtomTypes:ArbitrarySize;16;Nume
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
648 ricalValues;IDsAndValuesString;C1 C10 C11 C14 C18 C20 C21 C22 C5 CS F
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
649 N11 N4 O10 O2 O9;5 1 1 1 14 4 2 1 2 2 1 1 1 1 3 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
650
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
651 FingerprintsVector;AtomTypesCount:SLogPAtomTypes:FixedSize;67;OrderedN
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
652 umericalValues;IDsAndValuesString;C1 C2 C3 C4 C5 C6 C7 C8 C9 C10 C11 C
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
653 12 C13 C14 C15 C16 C17 C18 C19 C20 C21 C22 C23 C24 C25 C26 C27 CS N1 N
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
654 2 N3 N4 N5 N6 N7 N8 N9 N10 N11 N12 N13 N14 NS O1 O2 O3 O4 O5 O6 O7 O8
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
655 O9 O10 O11 O12 OS F Cl Br I Hal P S1 S2 S3 Me1 Me2;5 0 0 0 2 0 0 0 0 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
656 1 0 0 1 0 0 0 14 0 4 2 1 0 0 0 0 0 2 0 0 0 1 0 0 0 0 0 0 1 0 0 0 0...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
657
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
658 FingerprintsVector;EStateIndicies:ArbitrarySize;11;NumericalValues;IDs
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
659 AndValuesString;SaaCH SaasC SaasN SdO SdssC SsCH3 SsF SsOH SssCH2 SssN
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
660 H SsssCH;24.778 4.387 1.993 25.023 -1.435 3.975 14.006 29.759 -0.073 3
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
661 .024 -2.270
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
662
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
663 FingerprintsVector;EStateIndicies:FixedSize;87;OrderedNumericalValues;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
664 ValuesString;0 0 0 0 0 0 0 3.975 0 -0.073 0 0 24.778 -2.270 0 0 -1.435
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
665 4.387 0 0 0 0 0 0 3.024 0 0 0 0 0 0 0 1.993 0 29.759 25.023 0 0 0 0 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
666 4.006 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
667 0 0 0 0 0 0 0 0 0 0 0 0 0 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
668
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
669 FingerprintsVector;ExtendedConnectivity:AtomicInvariantsAtomTypes:Radi
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
670 us2;60;AlphaNumericalValues;ValuesString;73555770 333564680 352413391
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
671 666191900 1001270906 1371674323 1481469939 1977749791 2006158649 21414
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
672 08799 49532520 64643108 79385615 96062769 273726379 564565671 85514103
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
673 5 906706094 988546669 1018231313 1032696425 1197507444 1331250018 1338
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
674 532734 1455473691 1607485225 1609687129 1631614296 1670251330 17303...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
675
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
676 FingerprintsVector;ExtendedConnectivityCount:AtomicInvariantsAtomTypes
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
677 :Radius2;60;NumericalValues;IDsAndValuesString;73555770 333564680 3524
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
678 13391 666191900 1001270906 1371674323 1481469939 1977749791 2006158649
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
679 2141408799 49532520 64643108 79385615 96062769 273726379 564565671...;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
680 3 2 1 1 14 1 2 10 4 3 1 1 1 1 2 1 2 1 1 1 2 3 1 1 2 1 3 3 8 2 2 2 6 2
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
681 1 2 1 1 2 1 1 1 2 1 1 2 1 2 1 1 1 1 1 1 1 1 1 2 1 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
682
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
683 FingerprintsBitVector;ExtendedConnectivityBits:AtomicInvariantsAtomTyp
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
684 es:Radius2;1024;BinaryString;Ascending;0000000000000000000000000000100
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
685 0000000001010000000110000011000000000000100000000000000000000000100001
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
686 1000000110000000000000000000000000010011000000000000000000000000010000
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
687 0000000000000000000000000010000000000000000001000000000000000000000000
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
688 0000000000010000100001000000000000101000000000000000100000000000000...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
689
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
690 FingerprintsVector;ExtendedConnectivity:FunctionalClassAtomTypes:Radiu
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
691 s2;57;AlphaNumericalValues;ValuesString;24769214 508787397 850393286 8
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
692 62102353 981185303 1231636850 1649386610 1941540674 263599683 32920567
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
693 1 571109041 639579325 683993318 723853089 810600886 885767127 90326012
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
694 7 958841485 981022393 1126908698 1152248391 1317567065 1421489994 1455
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
695 632544 1557272891 1826413669 1983319256 2015750777 2029559552 20404...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
696
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
697 FingerprintsVector;ExtendedConnectivity:EStateAtomTypes:Radius2;62;Alp
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
698 haNumericalValues;ValuesString;25189973 528584866 662581668 671034184
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
699 926543080 1347067490 1738510057 1759600920 2034425745 2097234755 21450
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
700 44754 96779665 180364292 341712110 345278822 386540408 387387308 50430
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
701 1706 617094135 771528807 957666640 997798220 1158349170 1291258082 134
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
702 1138533 1395329837 1420277211 1479584608 1486476397 1487556246 1566...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
703
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
704 FingerprintsBitVector;MACCSKeyBits;166;BinaryString;Ascending;00000000
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
705 0000000000000000000000000000000001001000010010000000010010000000011100
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
706 0100101010111100011011000100110110000011011110100110111111111111011111
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
707 11111111111110111000
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
708
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
709 FingerprintsBitVector;MACCSKeyBits;322;BinaryString;Ascending;11101011
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
710 1110011111100101111111000111101100110000000000000011100010000000000000
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
711 0000000000000000000000000000000000000000000000101000000000000000000000
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
712 0000000000000000000000000000000000000000000000000000000000000000000000
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
713 0000000000000000000000000000000000000011000000000000000000000000000000
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
714 0000000000000000000000000000000000000000
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
715
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
716 FingerprintsVector;MACCSKeyCount;166;OrderedNumericalValues;ValuesStri
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
717 ng;0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
718 0 0 0 0 0 0 0 1 0 0 3 0 0 0 0 4 0 0 2 0 0 0 0 0 0 0 0 2 0 0 2 0 0 0 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
719 0 0 0 0 1 1 8 0 0 0 1 0 0 1 0 1 0 1 0 3 1 3 1 0 0 0 1 2 0 11 1 0 0 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
720 5 0 0 1 2 0 1 1 0 0 0 0 0 1 1 0 1 1 1 1 0 4 0 0 1 1 0 4 6 1 1 1 2 1 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
721 3 5 2 2 0 5 3 5 1 1 2 5 1 2 1 2 4 8 3 5 5 2 2 0 3 5 4 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
722
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
723 FingerprintsVector;MACCSKeyCount;322;OrderedNumericalValues;ValuesStri
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
724 ng;14 8 2 0 2 0 4 4 2 1 4 0 0 2 5 10 5 2 1 0 0 2 0 5 13 3 28 5 5 3 0 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
725 0 4 2 1 1 0 1 1 0 0 2 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 22 5 3 0 0 0 1 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
726 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
727 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 11 0 2 0 0 0 0 0 0 0 0 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
728 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
729
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
730 FingerprintsBitVector;PathLengthBits:AtomicInvariantsAtomTypes:MinLeng
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
731 th1:MaxLength8;1024;BinaryString;Ascending;001000010011010101011000110
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
732 0100010101011000101001011100110001000010001001101000001001001001001000
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
733 0010110100000111001001000001001010100100100000000011000000101001011100
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
734 0010000001000101010100000100111100110111011011011000000010110111001101
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
735 0101100011000000010001000011000010100011101100001000001000100000000...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
736
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
737 FingerprintsVector;PathLengthCount:AtomicInvariantsAtomTypes:MinLength
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
738 1:MaxLength8;432;NumericalValues;IDsAndValuesPairsString;C.X1.BO1.H3 2
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
739 C.X2.BO2.H2 4 C.X2.BO3.H1 14 C.X3.BO3.H1 3 C.X3.BO4 10 F.X1.BO1 1 N.X
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
740 2.BO2.H1 1 N.X3.BO3 1 O.X1.BO1.H1 3 O.X1.BO2 2 C.X1.BO1.H3C.X3.BO3.H1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
741 2 C.X2.BO2.H2C.X2.BO2.H2 1 C.X2.BO2.H2C.X3.BO3.H1 4 C.X2.BO2.H2C.X3.BO
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
742 4 1 C.X2.BO2.H2N.X3.BO3 1 C.X2.BO3.H1:C.X2.BO3.H1 10 C.X2.BO3.H1:C....
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
743
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
744 FingerprintsVector;PathLengthCount:MMFF94AtomTypes:MinLength1:MaxLengt
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
745 h8;463;NumericalValues;IDsAndValuesPairsString;C5A 2 C5B 2 C=ON 1 CB 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
746 8 COO 1 CR 9 F 1 N5 1 NC=O 1 O=CN 1 O=CO 1 OC=O 1 OR 2 C5A:C5B 2 C5A:N
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
747 5 2 C5ACB 1 C5ACR 1 C5B:C5B 1 C5BC=ON 1 C5BCB 1 C=ON=O=CN 1 C=ONNC=O 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
748 CB:CB 18 CBF 1 CBNC=O 1 COO=O=CO 1 COOCR 1 COOOC=O 1 CRCR 7 CRN5 1 CR
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
749 OR 2 C5A:C5B:C5B 2 C5A:C5BC=ON 1 C5A:C5BCB 1 C5A:N5:C5A 1 C5A:N5CR ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
750
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
751 FingerprintsVector;TopologicalAtomPairs:AtomicInvariantsAtomTypes:MinD
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
752 istance1:MaxDistance10;223;NumericalValues;IDsAndValuesString;C.X1.BO1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
753 .H3-D1-C.X3.BO3.H1 C.X2.BO2.H2-D1-C.X2.BO2.H2 C.X2.BO2.H2-D1-C.X3.BO3.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
754 H1 C.X2.BO2.H2-D1-C.X3.BO4 C.X2.BO2.H2-D1-N.X3.BO3 C.X2.BO3.H1-D1-...;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
755 2 1 4 1 1 10 8 1 2 6 1 2 2 1 2 1 2 2 1 2 1 5 1 10 12 2 2 1 2 1 9 1 3 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
756 1 1 2 2 1 3 6 1 6 14 2 2 2 3 1 3 1 8 2 2 1 3 2 6 1 2 2 5 1 3 1 23 1...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
757
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
758 FingerprintsVector;TopologicalAtomPairs:FunctionalClassAtomTypes:MinDi
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
759 stance1:MaxDistance10;144;NumericalValues;IDsAndValuesString;Ar-D1-Ar
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
760 Ar-D1-Ar.HBA Ar-D1-HBD Ar-D1-Hal Ar-D1-None Ar.HBA-D1-None HBA-D1-NI H
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
761 BA-D1-None HBA.HBD-D1-NI HBA.HBD-D1-None HBD-D1-None NI-D1-None No...;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
762 23 2 1 1 2 1 1 1 1 2 1 1 7 28 3 1 3 2 8 2 1 1 1 5 1 5 24 3 3 4 2 13 4
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
763 1 1 4 1 5 22 4 4 3 1 19 1 1 1 1 1 2 2 3 1 1 8 25 4 5 2 3 1 26 1 4 1 ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
764
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
765 FingerprintsVector;TopologicalAtomTorsions:AtomicInvariantsAtomTypes;3
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
766 3;NumericalValues;IDsAndValuesString;C.X1.BO1.H3-C.X3.BO3.H1-C.X3.BO4-
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
767 C.X3.BO4 C.X1.BO1.H3-C.X3.BO3.H1-C.X3.BO4-N.X3.BO3 C.X2.BO2.H2-C.X2.BO
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
768 2.H2-C.X3.BO3.H1-C.X2.BO2.H2 C.X2.BO2.H2-C.X2.BO2.H2-C.X3.BO3.H1-O...;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
769 2 2 1 1 2 2 1 1 3 4 4 8 4 2 2 6 2 2 1 2 1 1 2 1 1 2 6 2 4 2 1 3 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
770
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
771 FingerprintsVector;TopologicalAtomTorsions:EStateAtomTypes;36;Numerica
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
772 lValues;IDsAndValuesString;aaCH-aaCH-aaCH-aaCH aaCH-aaCH-aaCH-aasC aaC
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
773 H-aaCH-aasC-aaCH aaCH-aaCH-aasC-aasC aaCH-aaCH-aasC-sF aaCH-aaCH-aasC-
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
774 ssNH aaCH-aasC-aasC-aasC aaCH-aasC-aasC-aasN aaCH-aasC-ssNH-dssC a...;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
775 4 4 8 4 2 2 6 2 2 2 4 3 2 1 3 3 2 2 2 1 2 1 1 1 2 1 1 1 1 1 1 1 2 1 1 2
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
776
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
777 FingerprintsVector;TopologicalAtomTriplets:AtomicInvariantsAtomTypes:M
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
778 inDistance1:MaxDistance10;3096;NumericalValues;IDsAndValuesString;C.X1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
779 .BO1.H3-D1-C.X1.BO1.H3-D1-C.X3.BO3.H1-D2 C.X1.BO1.H3-D1-C.X2.BO2.H2-D1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
780 0-C.X3.BO4-D9 C.X1.BO1.H3-D1-C.X2.BO2.H2-D3-N.X3.BO3-D4 C.X1.BO1.H3-D1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
781 -C.X2.BO2.H2-D4-C.X2.BO2.H2-D5 C.X1.BO1.H3-D1-C.X2.BO2.H2-D6-C.X3....;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
782 1 2 2 2 2 2 2 2 8 8 4 8 4 4 2 2 2 2 4 2 2 2 4 2 2 2 2 1 2 2 4 4 4 2 2
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
783 2 4 4 4 8 4 4 2 4 4 4 2 4 4 2 2 2 2 2 2 2 2 1 2 2 2 2 2 2 2 2 2 2 8...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
784
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
785 FingerprintsVector;TopologicalAtomTriplets:SYBYLAtomTypes:MinDistance1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
786 :MaxDistance10;2332;NumericalValues;IDsAndValuesString;C.2-D1-C.2-D9-C
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
787 .3-D10 C.2-D1-C.2-D9-C.ar-D10 C.2-D1-C.3-D1-C.3-D2 C.2-D1-C.3-D10-C.3-
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
788 D9 C.2-D1-C.3-D2-C.3-D3 C.2-D1-C.3-D2-C.ar-D3 C.2-D1-C.3-D3-C.3-D4 C.2
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
789 -D1-C.3-D3-N.ar-D4 C.2-D1-C.3-D3-O.3-D2 C.2-D1-C.3-D4-C.3-D5 C.2-D1-C.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
790 3-D5-C.3-D6 C.2-D1-C.3-D5-O.3-D4 C.2-D1-C.3-D6-C.3-D7 C.2-D1-C.3-D7...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
791
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
792 FingerprintsVector;TopologicalPharmacophoreAtomPairs:ArbitrarySize:Min
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
793 Distance1:MaxDistance10;54;NumericalValues;IDsAndValuesString;H-D1-H H
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
794 -D1-NI HBA-D1-NI HBD-D1-NI H-D2-H H-D2-HBA H-D2-HBD HBA-D2-HBA HBA-D2-
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
795 HBD H-D3-H H-D3-HBA H-D3-HBD H-D3-NI HBA-D3-NI HBD-D3-NI H-D4-H H-D4-H
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
796 BA H-D4-HBD HBA-D4-HBA HBA-D4-HBD HBD-D4-HBD H-D5-H H-D5-HBA H-D5-...;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
797 18 1 2 1 22 12 8 1 2 18 6 3 1 1 1 22 13 6 5 7 2 28 9 5 1 1 1 36 16 10
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
798 3 4 1 37 10 8 1 35 10 9 3 3 1 28 7 7 4 18 16 12 5 1 2 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
799
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
800 FingerprintsVector;TopologicalPharmacophoreAtomPairs:FixedSize:MinDist
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
801 ance1:MaxDistance10;150;OrderedNumericalValues;ValuesString;18 0 0 1 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
802 0 0 2 0 0 1 0 0 0 0 22 12 8 0 0 1 2 0 0 0 0 0 0 0 0 18 6 3 1 0 0 0 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
803 0 0 1 0 0 0 0 22 13 6 0 0 5 7 0 0 2 0 0 0 0 0 28 9 5 1 0 0 0 1 0 0 1 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
804 0 0 0 36 16 10 0 0 3 4 0 0 1 0 0 0 0 0 37 10 8 0 0 0 0 1 0 0 0 0 0 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
805 0 35 10 9 0 0 3 3 0 0 1 0 0 0 0 0 28 7 7 4 0 0 0 0 0 0 0 0 0 0 0 18...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
806
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
807 FingerprintsVector;TopologicalPharmacophoreAtomTriplets:ArbitrarySize:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
808 MinDistance1:MaxDistance10;696;NumericalValues;IDsAndValuesString;Ar1-
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
809 Ar1-Ar1 Ar1-Ar1-H1 Ar1-Ar1-HBA1 Ar1-Ar1-HBD1 Ar1-H1-H1 Ar1-H1-HBA1 Ar1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
810 -H1-HBD1 Ar1-HBA1-HBD1 H1-H1-H1 H1-H1-HBA1 H1-H1-HBD1 H1-HBA1-HBA1 H1-
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
811 HBA1-HBD1 H1-HBA1-NI1 H1-HBD1-NI1 HBA1-HBA1-NI1 HBA1-HBD1-NI1 Ar1-...;
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
812 46 106 8 3 83 11 4 1 21 5 3 1 2 2 1 1 1 100 101 18 11 145 132 26 14 23
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
813 28 3 3 5 4 61 45 10 4 16 20 7 5 1 3 4 5 3 1 1 1 1 5 4 2 1 2 2 2 1 1 1
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
814 119 123 24 15 185 202 41 25 22 17 3 5 85 95 18 11 23 17 3 1 1 6 4 ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
815
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
816 FingerprintsVector;TopologicalPharmacophoreAtomTriplets:FixedSize:MinD
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
817 istance1:MaxDistance10;2692;OrderedNumericalValues;ValuesString;46 106
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
818 8 3 0 0 83 11 4 0 0 0 1 0 0 0 0 0 0 0 0 21 5 3 0 0 1 2 2 0 0 1 0 0 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
819 0 0 0 1 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 100 101 18 11 0 0 145 132 26
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
820 14 0 0 23 28 3 3 0 0 5 4 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 61 45 10 4 0
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
821 0 16 20 7 5 1 0 3 4 5 3 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 1 1 0 0 5 ...
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
822
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
823 =head1 OPTIONS
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
824
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
825 =over 4
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
826
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
827 =item B<-a, --all>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
828
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
829 List all the available information.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
830
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
831 =item B<--AverageBitDensity>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
832
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
833 List average bit density of fingerprint bit-vector strings.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
834
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
835 =item B<--BitDensity>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
836
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
837 List bit density of fingerprints bit-vector strings data in each row.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
838
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
839 =item B<--count>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
840
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
841 List number of data entries containing fingerprints bit-vector or vector strings data. This
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
842 is the B<default behavior>.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
843
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
844 =item B<-c, --ColMode> I<ColNum | ColLabel>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
845
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
846 Specify how columns are identified in CSV/TSV I<TextFile(s)>: using column number or column
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
847 label. Possible values: I<ColNum or ColLabel>. Default value: I<ColNum>.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
848
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
849 =item B<-d, --detail> I<InfoLevel>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
850
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
851 Level of information to print about lines being ignored. Default: I<1>. Possible values:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
852 I<1, 2 or 3>.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
853
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
854 =item B<--DataCheck>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
855
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
856 Validate fingerprints data specified using B<--FingerprintsCol> and list information
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
857 about missing and invalid data.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
858
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
859 =item B<-e, --empty>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
860
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
861 List number of rows containing no fingerprints data.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
862
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
863 =item B<--FingerprintsCol> I<col number | col label>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
864
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
865 This value is B<-c, --ColMode> specific. It corresponds to column in CSV/TSV I<TextFile(s)>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
866 containing fingerprints data. Possible values: I<col number or col label>.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
867 Default value: I<first column containing the word Fingerprints in its column label>.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
868
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
869 =item B<--FingerprintsField> I<FieldLabel>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
870
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
871 Fingerprints field label to use during listing of fingerprints information for I<SDFile(s)>.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
872 Default value: I<first data field label containing the word Fingerprints in its label>.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
873
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
874 =item B<--FingerprintsType>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
875
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
876 List types of fingerprint strings: FingerprintsBitVector or FingerprintsVector.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
877
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
878 =item B<--FingerprintsDescription>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
879
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
880 List types of fingerprints: PathLengthBits, PathLengthCount, MACCSKeyCount,
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
881 ExtendedConnectivity and so on.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
882
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
883 =item B<--FingerprintsSize>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
884
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
885 List size of fingerprints.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
886
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
887 =item B<--FingerprintsBitStringFormat>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
888
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
889 List format of fingerprint bit-vector strings: BinaryString or HexadecimalString.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
890
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
891 =item B<--FingerprintsBitOrder>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
892
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
893 List order of bits in fingerprint bit-vector strings: Ascending or Descending.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
894
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
895 =item B<--FingerprintsVectorValuesType>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
896
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
897 List type of values in fingerprint vector strings: OrderedNumericalValues, NumericalValues or
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
898 AlphaNumericalValues.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
899
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
900 =item B<--FingerprintsVectorValuesFormat>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
901
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
902 List format of values in fingerprint vector strings: ValuesString, IDsAndValuesString,
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
903 IDsAndValuesPairsString, ValuesAndIDsString or ValuesAndIDsPairsString.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
904
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
905 =item B<-h, --help>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
906
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
907 Print this help message.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
908
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
909 =item B<--InDelim> I<comma | semicolon>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
910
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
911 Input delimiter for CSV I<TextFile(s)>. Possible values: I<comma or semicolon>.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
912 Default value: I<comma>. For TSV files, this option is ignored and I<tab> is used as a
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
913 delimiter.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
914
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
915 =item B<--NumOfOnBits>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
916
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
917 List number of on bits in fingerprints bit-vector strings data in each row.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
918
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
919 =item B<--NumOfNonZeroValues>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
920
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
921 List number of non-zero values in fingerprints vector strings data in each row.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
922
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
923 =item B<-w, --WorkingDir> I<DirName>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
924
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
925 Location of working directory. Default: current directory.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
926
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
927 =back
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
928
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
929 =head1 EXAMPLES
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
930
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
931 To count number of lines containing fingerprints bit-vector or vector strings data present
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
932 in FP file, in a column name containing Fingerprint substring in text file, and in a data
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
933 field with Fingerprint substring in its label, type:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
934
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
935 % InfoFingerprintsFiles.pl SampleFPBin.csv
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
936
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
937 % InfoFingerprintsFiles.pl SampleFPBin.sdf SampleFPBin.fpf
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
938 SampleFPBin.csv
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
939
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
940 % InfoFingerprintsFiles.pl SampleFPHex.sdf SampleFPHex.fpf
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
941 SampleFPHex.csv
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
942
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
943 % InfoFingerprintsFiles.pl SampleFPcount.sdf SampleFPcount.fpf
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
944 SampleFPcount.csv
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
945
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
946 To list all available information about fingerprints bit-vector or vector strings data present
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
947 in FP file, in a column name containing Fingerprint substring in text file, and in a data
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
948 field with Fingerprint substring in its label, type:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
949
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
950 % InfoFingerprintsFiles.pl -a SampleFPHex.sdf SampleFPHex.fpf
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
951 SampleFPHex.csv
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
952
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
953 % InfoFingerprintsFiles.pl -a SampleFPcount.sdf SampleFPcount.fpf
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
954 SampleFPcount.csv
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
955
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
956 To list all available information about fingerprints bit-vector or vector strings data present in a
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
957 column named Fingerprints in text file, type:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
958
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
959 % InfoFingerprintsFiles.pl -a --ColMode ColLabel --FingerprintsCol
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
960 Fingerprints SampleFPHex.csv
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
961
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
962 % InfoFingerprintsFiles.pl -a --ColMode ColLabel --FingerprintsCol
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
963 Fingerprints SampleFPcount.csv
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
964
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
965 To list all available information about fingerprints bit-vector or vector strings data present in a
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
966 data field named Fingerprints in SD file, type:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
967
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
968 % InfoFingerprintsFiles.pl -a --FingerprintsField Fingerprints
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
969 SampleFPHex.sdf
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
970
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
971 % InfoFingerprintsFiles.pl -a --FingerprintsField Fingerprints
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
972 SampleFPcount.sdf
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
973
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
974 To list bit density, average bit density, and number of on bits for fingerprints bit-vector strings data
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
975 present in FP file, in a column name containing Fingerprint substring in text file, and in a data
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
976 field with Fingerprint substring in its label, type:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
977
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
978 % InfoFingerprintsFiles.pl --BitDensity --AverageBitDensity
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
979 --NumOfOnBits SampleFPBin.csv SampleFPBin.sdf SampleFPBin.fpf
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
980
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
981 To list vector values type, format and number of non-zero values for fingerprints vector strings
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
982 data present in FP file, in a column name containing Fingerprint substring in text file, and in a data
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
983 field with Fingerprint substring in its label along with fingerprints type and description, type:
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
984
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
985 % InfoFingerprintsFiles.pl --FingerprintsType --FingerprintsDescription
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
986 --FingerprintsVectorValuesType --FingerprintsVectorValuesFormat
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
987 --NumOfNonZeroValues SampleFPcount.csv SampleFPcount.sdf
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
988 SampleFPcount.fpf
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
989
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
990 =head1 AUTHOR
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
991
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
992 Manish Sud <msud@san.rr.com>
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
993
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
994 =head1 SEE ALSO
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
995
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
996 SimilarityMatricesFingerprints.pl, SimilaritySearchingFingerprints.pl, AtomNeighborhoodsFingerprints.pl,
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
997 ExtendedConnectivityFingerprints.pl, MACCSKeysFingerprints.pl,
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
998 PathLengthFingerprints.pl, TopologicalAtomPairsFingerprints.pl, TopologicalAtomTorsionsFingerprints.pl,
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
999 TopologicalPharmacophoreAtomPairsFingerprints.pl, TopologicalPharmacophoreAtomTripletsFingerprints.pl
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1000
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1001 =head1 COPYRIGHT
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1002
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1003 Copyright (C) 2015 Manish Sud. All rights reserved.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1004
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1005 This file is part of MayaChemTools.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1006
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1007 MayaChemTools is free software; you can redistribute it and/or modify it under
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1008 the terms of the GNU Lesser General Public License as published by the Free
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1009 Software Foundation; either version 3 of the License, or (at your option)
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1010 any later version.
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1011
73ae111cf86f Uploaded
deepakjadmin
parents:
diff changeset
1012 =cut