annotate bin/InfoFingerprintsFiles.pl @ 0:4816e4a8ae95 draft default tip

Uploaded
author deepakjadmin
date Wed, 20 Jan 2016 09:23:18 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1 #!/usr/bin/perl -w
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
2 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
3 # $RCSfile: InfoFingerprintsFiles.pl,v $
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
4 # $Date: 2015/02/28 20:46:20 $
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
5 # $Revision: 1.20 $
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
6 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
7 # Author: Manish Sud <msud@san.rr.com>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
8 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
9 # Copyright (C) 2015 Manish Sud. All rights reserved.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
10 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
11 # This file is part of MayaChemTools.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
12 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
13 # MayaChemTools is free software; you can redistribute it and/or modify it under
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
14 # the terms of the GNU Lesser General Public License as published by the Free
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
15 # Software Foundation; either version 3 of the License, or (at your option) any
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
16 # later version.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
17 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
18 # MayaChemTools is distributed in the hope that it will be useful, but without
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
19 # any warranty; without even the implied warranty of merchantability or fitness
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
20 # for a particular purpose. See the GNU Lesser General Public License for more
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
21 # details.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
22 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
23 # You should have received a copy of the GNU Lesser General Public License
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
24 # along with MayaChemTools; if not, see <http://www.gnu.org/licenses/> or
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
25 # write to the Free Software Foundation Inc., 59 Temple Place, Suite 330,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
26 # Boston, MA, 02111-1307, USA.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
27 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
28
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
29 use strict;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
30 use FindBin; use lib "$FindBin::Bin/../lib";
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
31 use Getopt::Long;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
32 use File::Basename;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
33 use Text::ParseWords;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
34 use Benchmark;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
35 use FileUtil;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
36 use TextUtil;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
37 use Fingerprints::FingerprintsFileUtil;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
38 use Fingerprints::FingerprintsStringUtil;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
39
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Main driver: print a start banner, collect options and input file names,
# gather per-file information, list information for each usable file, and
# finish with the total size and elapsed time.
#
# The lexicals declared here are file-scoped on purpose: the subroutines
# defined later in this file read them directly.
#
my($ScriptName, %Options, $StartTime, $EndTime, $TotalTime);

# Autoflush STDOUT
$| = 1;

# Starting message...
$ScriptName = basename($0);
print "\n$ScriptName: Starting...\n\n";

# Direct method call instead of the indirect object form "new Benchmark",
# which is parsed heuristically and is discouraged by the perlobj documentation...
$StartTime = Benchmark->new;

# Get the options and setup script...
# NOTE(review): SetupScriptUsage() is defined outside this section; it presumably
# fills %Options from the command line - confirm.
SetupScriptUsage();
if ($Options{help} || @ARGV < 1) {
  # Usage text is emitted through die, for an explicit help request as well as
  # for a missing file argument...
  die GetUsageFromPod("$FindBin::Bin/$ScriptName");
}

my(@FingerprintsFilesList);
@FingerprintsFilesList = ExpandFileNames(\@ARGV, "sdf sd fpf fp csv tsv");

# Process options...
print "Processing options...\n";
my(%OptionsInfo);
ProcessOptions();

# Setup information about input files...
print "Checking input fingerprints file(s)...\n";
my(%FingerprintsFilesInfo);
RetrieveFingerprintsFilesInfo();

# Process input files...
my($FileIndex);
if (@FingerprintsFilesList > 1) {
  print "\nProcessing fingerprints files...\n";
}
FILE: for $FileIndex (0 .. $#FingerprintsFilesList) {
  # Skip any file not flagged okay...
  next FILE unless $FingerprintsFilesInfo{FileOkay}[$FileIndex];

  print "\nProcessing file $FingerprintsFilesList[$FileIndex]...\n";
  ListFingerprintsFileInfo($FileIndex);
}
ListTotalSizeOfFiles();

print "\n$ScriptName:Done...\n\n";

# Report the elapsed time...
$EndTime = Benchmark->new;
$TotalTime = timediff($EndTime, $StartTime);
print "Total time: ", timestr($TotalTime), "\n";
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
87
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
88 ###############################################################################
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
89
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# List appropriate information for one fingerprints file...
#
# Parameter:
#   $FileIndex - index of the file in the per-file arrays of %FingerprintsFilesInfo
#
# Reads every data entry through a fingerprints file IO object, tallies the
# entries (total, missing, invalid, valid, bit-vector, vector), optionally lists
# per-entry details, and prints a summary followed by file size and last
# modified information.
#
sub ListFingerprintsFileInfo {
  my($FileIndex) = @_;

  my $FileType = $FingerprintsFilesInfo{FileType}[$FileIndex];
  my $IsSDFile = ($FileType =~ /^SD$/i) ? 1 : 0;
  my $DataEntryLabel = $IsSDFile ? 'compounds' : 'lines';

  my $DataEntryCount = 0;
  my $ValidDataEntryCount = 0;
  my $InvalidDataEntryCount = 0;
  my $MissingDataEntryCount = 0;
  my $BitVectorDataEntryCount = 0;
  my $VectorDataEntryCount = 0;
  my $TotalBitDensity = 0;

  my $FingerprintsFileIO = Fingerprints::FingerprintsFileUtil::NewFingerprintsFileIO(%{$FingerprintsFilesInfo{FingerprintsFileIOParameters}[$FileIndex]});
  $FingerprintsFileIO->Open();

  # File level validity is checked once, before any entry is read; when it is
  # false, every entry read below is counted as missing...
  my $InvalidFingerprintsFileData = $FingerprintsFileIO->IsFingerprintsFileDataValid() ? 0 : 1;

  FINGERPRINTS: while ($FingerprintsFileIO->Read()) {
    $DataEntryCount++;

    # Missing data...
    if ($InvalidFingerprintsFileData) {
      $MissingDataEntryCount++;
      ListEmptyOrInvalidFingerprintsDataInfo('EmptyData', $FingerprintsFileIO, $FileType)
        if ($OptionsInfo{ValidateData} || $OptionsInfo{CountEmptyFingerprints});
      next FINGERPRINTS;
    }

    # Invalid data...
    unless ($FingerprintsFileIO->IsFingerprintsDataValid()) {
      $InvalidDataEntryCount++;
      ListEmptyOrInvalidFingerprintsDataInfo('InvalidData', $FingerprintsFileIO, $FileType)
        if $OptionsInfo{ValidateData};
      next FINGERPRINTS;
    }
    $ValidDataEntryCount++;

    # Classify the valid entry by its vector type...
    my $FingerprintsObject = $FingerprintsFileIO->GetFingerprints();
    my $FingerprintsType = $FingerprintsObject->GetVectorType();

    if ($FingerprintsType =~ /^FingerprintsBitVector$/i) {
      $BitVectorDataEntryCount++;
      $TotalBitDensity += $FingerprintsObject->GetFingerprintsBitDensity()
        if $OptionsInfo{ListAverageBitDensity};
    }
    elsif ($FingerprintsType =~ /^FingerprintsVector$/i) {
      $VectorDataEntryCount++;
    }

    ListFingerprintsDataEntryInfo($FingerprintsFileIO, $FileType)
      if $OptionsInfo{ListFingerprintsDataEntryInfo};
  }
  $FingerprintsFileIO->Close();

  # Summary...
  my $TotalCountLabel = $IsSDFile ? 'compounds' : 'data lines';
  print "\nFingerprints file type: $FileType\n";
  print "Number of $TotalCountLabel: $DataEntryCount\n";

  # Header information is requested from the IO object after it has been closed...
  ListFileTypeHeaderInfo($FingerprintsFileIO, $FileType);

  print "\nNumber of $DataEntryLabel with valid fingerprints string data: $ValidDataEntryCount\n";
  print "Number of $DataEntryLabel with bit-vector fingerprints string data: $BitVectorDataEntryCount\n";
  print "Number of $DataEntryLabel with vector fingerprints string data: $VectorDataEntryCount\n";

  # Missing and invalid counts are reported only on request...
  if ($OptionsInfo{CountEmptyFingerprints}) {
    print "Number of $DataEntryLabel with missing fingerprints data: $MissingDataEntryCount\n";
    print "Number of $DataEntryLabel with invalid fingerprints data: $InvalidDataEntryCount\n";
  }

  # Average over bit-vector entries only; skipped when there are none to avoid
  # dividing by zero...
  if ($OptionsInfo{ListAverageBitDensity} && $BitVectorDataEntryCount) {
    # Adding 0 turns the formatted string back into a number, dropping trailing zeros...
    my $AverageBitDensity = sprintf("%.2f", $TotalBitDensity/$BitVectorDataEntryCount) + 0;
    print "\nAverage bit density: $AverageBitDensity\n";
  }

  # File size and modification information...
  print "\nFile size: ", FormatFileSize($FingerprintsFilesInfo{FileSize}[$FileIndex]), " \n";
  print "Last modified: ", $FingerprintsFilesInfo{FileLastModified}[$FileIndex], " \n";
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
180
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# List empty or invalid fingerprints file data information...
#
# Parameters:
#   $Mode               - 'EmptyData' reports "no" fingerprints data; any other
#                         value reports "invalid" fingerprints data
#   $FingerprintsFileIO - fingerprints file IO object positioned at the entry
#   $FileType           - 'SD' entries are reported by compound number, all
#                         other file types by data line number
#
# Output depends on $OptionsInfo{DetailLevel}: 3 or more also prints the entry
# itself, 1 or 2 prints a short message, and anything lower prints nothing.
#
sub ListEmptyOrInvalidFingerprintsDataInfo {
  my($Mode, $FingerprintsFileIO, $FileType) = @_;

  my $ModeInfo = ($Mode =~ /^EmptyData$/i) ? "no" : "invalid";
  my $IsSDFile = ($FileType =~ /^SD$/i) ? 1 : 0;

  # The entry number is retrieved irrespective of the detail level...
  my $EntryLabel = $IsSDFile ? "Compound number" : "Data line number";
  my $EntryNum = $IsSDFile ? $FingerprintsFileIO->GetCompoundNum() : $FingerprintsFileIO->GetLineNum();

  if ($OptionsInfo{DetailLevel} >= 3 ) {
    my $EntryData = $IsSDFile ? $FingerprintsFileIO->GetCompoundString() : $FingerprintsFileIO->GetDataLine();
    print "$EntryLabel $EntryNum contains $ModeInfo fingerprints data: $EntryData \n";
  }
  elsif ($OptionsInfo{DetailLevel} >= 1 ) {
    print "$EntryLabel $EntryNum contains $ModeInfo fingerprints data...\n";
  }
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
214
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# List detailed information about fingerprints data entry...
#
# Parameters:
#   $FingerprintsFileIO - fingerprints file IO object positioned at a valid entry
#   $FileType           - 'SD' entries are labeled by compound number, all other
#                         file types by data line number
#
# Prints a single line made up of the entry number followed by the "; Name: value"
# fields selected through the List* flags in %OptionsInfo.
#
sub ListFingerprintsDataEntryInfo {
  my($FingerprintsFileIO, $FileType) = @_;

  my $FingerprintsObject = $FingerprintsFileIO->GetFingerprints();
  my $FingerprintsString = $FingerprintsFileIO->GetFingerprintsString();
  my $FingerprintsType = $FingerprintsObject->GetVectorType();

  my($FingerprintsDescription, $FingerprintsSize);
  my($FingerprintsBitStringFormat, $FingerprintsBitOrder, $BitDensity, $NumOfOnBits);
  my($FingerprintsVectorValuesType, $FingerprintsVectorValuesFormat, $NumOfNonZeroValues);

  # Retrieve type specific values. Note that $FingerprintsType is replaced by the
  # type parsed out of the fingerprints string...
  if ($FingerprintsType =~ /^FingerprintsBitVector$/i) {
    ($FingerprintsType, $FingerprintsDescription, $FingerprintsSize, $FingerprintsBitStringFormat, $FingerprintsBitOrder) = Fingerprints::FingerprintsStringUtil::GetFingerprintsStringValues($FingerprintsString);

    $BitDensity = $OptionsInfo{ListBitDensity} ? $FingerprintsObject->GetFingerprintsBitDensity() : '';
    $NumOfOnBits = $OptionsInfo{ListNumOfOnBits} ? $FingerprintsObject->GetNumOfSetBits() : '';
  }
  elsif ($FingerprintsType =~ /^FingerprintsVector$/i) {
    ($FingerprintsType, $FingerprintsDescription, $FingerprintsSize, $FingerprintsVectorValuesType, $FingerprintsVectorValuesFormat) = Fingerprints::FingerprintsStringUtil::GetFingerprintsStringValues($FingerprintsString);

    $NumOfNonZeroValues = '';
    if ($OptionsInfo{ListNumOfNonZeroValues}) {
      # A count is not requested for alphanumerical values; NA is listed instead...
      $NumOfNonZeroValues = ($FingerprintsVectorValuesType =~ /^AlphaNumericalValues$/i) ? 'NA' : $FingerprintsObject->GetNumOfNonZeroValues();
    }
  }

  # Collect the requested fields; the entry number always comes first...
  my @EntryInfo = ();
  if ($FileType =~ /^SD$/i) {
    push @EntryInfo, "Compound number: " . $FingerprintsFileIO->GetCompoundNum();
  }
  else {
    push @EntryInfo, "Data line number: " . $FingerprintsFileIO->GetLineNum();
  }

  push @EntryInfo, "FPType: $FingerprintsType" if $OptionsInfo{ListFingerprintsType};
  push @EntryInfo, "FPDescription: $FingerprintsDescription" if $OptionsInfo{ListFingerprintsDescription};
  push @EntryInfo, "FPSize: $FingerprintsSize" if $OptionsInfo{ListFingerprintsSize};

  # Type specific fields, keyed off the type parsed from the fingerprints string...
  if ($FingerprintsType =~ /^FingerprintsBitVector$/i) {
    push @EntryInfo, "FPBitStringFormat: $FingerprintsBitStringFormat" if $OptionsInfo{ListFingerprintsBitStringFormat};
    push @EntryInfo, "FPBitOrder: $FingerprintsBitOrder" if $OptionsInfo{ListFingerprintsBitOrder};
    push @EntryInfo, "BitDensity: $BitDensity" if $OptionsInfo{ListBitDensity};
    push @EntryInfo, "NumOfOnBits: $NumOfOnBits" if $OptionsInfo{ListNumOfOnBits};
  }
  elsif ($FingerprintsType =~ /^FingerprintsVector$/i) {
    push @EntryInfo, "FPVectorValuesType: $FingerprintsVectorValuesType" if $OptionsInfo{ListFingerprintsVectorValuesType};
    push @EntryInfo, "FPVectorValuesFormat: $FingerprintsVectorValuesFormat" if $OptionsInfo{ListFingerprintsVectorValuesFormat};
    push @EntryInfo, "NumOfNonZeroValues: $NumOfNonZeroValues" if $OptionsInfo{ListNumOfNonZeroValues};
  }

  print join("; ", @EntryInfo) . "\n";
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
300
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# List file type header information...
#
# Parameters:
#   $FingerprintsFileIO - fingerprints file IO object to retrieve header data from
#   $FileType           - 'Text' lists the number of columns and column labels;
#                         'FP' lists header data keys and values; nothing is
#                         listed for any other file type
#
sub ListFileTypeHeaderInfo {
  my($FingerprintsFileIO, $FileType) = @_;

  if ($FileType =~ /^Text$/i) {
    my @DataColLabels = $FingerprintsFileIO->GetDataColLabels();
    my $NumOfCols = scalar(@DataColLabels);

    print "Number of columns: $NumOfCols\n";
    print "Column labels: ", JoinWords(\@DataColLabels, ", ", 1), "\n";
  }
  elsif ($FileType =~ /^FP$/i) {
    my %HeaderDataKeysAndValues = $FingerprintsFileIO->GetHeaderDataKeysAndValues();

    # Keys are listed in the order returned by GetHeaderDataKeys...
    print "\nFP file header data keys and values: \n#\n";
    for my $Key ($FingerprintsFileIO->GetHeaderDataKeys()) {
      print "# $Key = $HeaderDataKeysAndValues{$Key}\n";
    }
    print "#\n";
  }
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
323
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Total size of all the files...
#
# Sums $FingerprintsFilesInfo{FileSize} over the files flagged okay and prints
# the total, but only when more than one such file exists. Takes no parameters;
# reads the file-scoped @FingerprintsFilesList and %FingerprintsFilesInfo.
#
sub ListTotalSizeOfFiles {
  my($FileOkayCount, $TotalSize, $Index);

  $FileOkayCount = 0;
  $TotalSize = 0;

  for $Index (0 .. $#FingerprintsFilesList) {
    # Test the per-file FileOkay flag - the same flag the main loop uses to decide
    # which files to process - rather than the file name itself. A file name is
    # nearly always a true value, which caused files not flagged okay to be
    # included in the reported file count...
    if ($FingerprintsFilesInfo{FileOkay}[$Index]) {
      $FileOkayCount++;
      $TotalSize += $FingerprintsFilesInfo{FileSize}[$Index];
    }
  }
  if ($FileOkayCount > 1) {
    print "\nTotal size of $FileOkayCount files: ", FormatFileSize($TotalSize), "\n";
  }
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
341
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Retrieve information about fingerprints files...
#
# Takes no arguments. For each entry in @FingerprintsFilesList, the
# following per-file arrays in %FingerprintsFilesInfo are filled at the same
# index: FileOkay, FileType, FileSize, FileLastModified, InDelim and
# FingerprintsFileIOParameters. Files which don't exist, have no recognizable
# fingerprints file type or have an unsupported type are reported using warn
# and keep their default values with FileOkay set to 0.
#
sub RetrieveFingerprintsFilesInfo {
  my($FingerprintsFile, $FileType, $FileIndex, $FileExt, $Delim, $TimeString, $DateString, %FileIOParameters);

  # Start with an empty array for each type of information...
  %FingerprintsFilesInfo = map { ($_ => []) } qw(FileOkay FileType FileSize FileLastModified InDelim FingerprintsFileIOParameters);

  FILELIST: for $FileIndex (0 .. $#FingerprintsFilesList) {
    $FingerprintsFile = $FingerprintsFilesList[$FileIndex];

    # Default values which stay in place for any file that gets ignored...
    $FingerprintsFilesInfo{FileOkay}[$FileIndex] = 0;
    $FingerprintsFilesInfo{FileType}[$FileIndex] = '';
    $FingerprintsFilesInfo{FileSize}[$FileIndex] = 0;
    $FingerprintsFilesInfo{FileLastModified}[$FileIndex] = '';
    $FingerprintsFilesInfo{InDelim}[$FileIndex] = "";
    $FingerprintsFilesInfo{FingerprintsFileIOParameters}[$FileIndex] = {};

    unless (-e $FingerprintsFile) {
      warn "Warning: Ignoring file $FingerprintsFile: It doesn't exist\n";
      next FILELIST;
    }

    $FileType = Fingerprints::FingerprintsFileUtil::GetFingerprintsFileType($FingerprintsFile);
    if (IsEmpty($FileType)) {
      warn "Warning: Ignoring file $FingerprintsFile: It's not a fingerprints file\n";
      next FILELIST;
    }

    # Only the extension is needed here: a tsv extension selects Tab as the
    # delimiter and anything else uses the value of InDelim option...
    (undef, undef, $FileExt) = ParseFileName($FingerprintsFile);
    $Delim = ($FileExt =~ /^tsv$/i) ? 'Tab' : $OptionsInfo{InDelim};

    # Setup FingerprintsFileIO parameters: the ones shared by all file types
    # first, followed by the ones specific to a file type...
    %FileIOParameters = ('Name' => $FingerprintsFile, 'Mode' => 'Read', 'ValidateData' => $OptionsInfo{ValidateData}, 'DetailLevel' => 1);
    if ($FileType =~ /^SD$/i) {
      $FileIOParameters{'FingerprintsFieldLabel'} = $OptionsInfo{FingerprintsFieldLabel};
    }
    elsif ($FileType =~ /^FP$/i) {
      # No additional parameters for FP files...
    }
    elsif ($FileType =~ /^Text$/i) {
      $FileIOParameters{'FingerprintsCol'} = $OptionsInfo{FingerprintsCol};
      $FileIOParameters{'ColMode'} = $OptionsInfo{ColMode};
      $FileIOParameters{'InDelim'} = $OptionsInfo{InDelim};
    }
    else {
      warn "Warning: File type for fingerprints file, $FingerprintsFile, is not valid. Supported file types: SD, FP or Text\n";
      next FILELIST;
    }

    # File is okay: track its information...
    $FingerprintsFilesInfo{FileOkay}[$FileIndex] = 1;
    $FingerprintsFilesInfo{FileType}[$FileIndex] = $FileType;

    $FingerprintsFilesInfo{FileSize}[$FileIndex] = FileSize($FingerprintsFile);
    ($TimeString, $DateString) = FormattedFileModificationTimeAndDate($FingerprintsFile);
    $FingerprintsFilesInfo{FileLastModified}[$FileIndex] = "$TimeString; $DateString";

    $FingerprintsFilesInfo{InDelim}[$FileIndex] = $Delim;

    $FingerprintsFilesInfo{FingerprintsFileIOParameters}[$FileIndex] = { %FileIOParameters };
  }
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
415
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Process option values...
#
# Takes no arguments. Resets the file-level %OptionsInfo and fills it using
# the values available in %Options. The script dies for a FingerprintsCol
# value which is not a positive integer during ColNum value of ColMode.
#
sub ProcessOptions {
  my($InfoKey, %FlagOptionNameFor, @DataEntryInfoKeys);

  %OptionsInfo = ();

  # Flags which get turned on either by their own option or by "all" option...
  %FlagOptionNameFor = (
    'ListAverageBitDensity' => 'averagebitdensity',
    'ListBitDensity' => 'bitdensity',
    'CountEmptyFingerprints' => 'empty',
    'ValidateData' => 'datacheck',
    'ListFingerprintsType' => 'fingerprintstype',
    'ListFingerprintsDescription' => 'fingerprintsdescription',
    'ListFingerprintsSize' => 'fingerprintssize',
    'ListFingerprintsBitStringFormat' => 'fingerprintsbitstringformat',
    'ListFingerprintsBitOrder' => 'fingerprintsbitorder',
    'ListFingerprintsVectorValuesType' => 'fingerprintsvectorvaluestype',
    'ListFingerprintsVectorValuesFormat' => 'fingerprintsvectorvaluesformat',
    'ListNumOfOnBits' => 'numofonbits',
    'ListNumOfNonZeroValues' => 'numofnonzerovalues',
  );
  for $InfoKey (keys %FlagOptionNameFor) {
    $OptionsInfo{$InfoKey} = ($Options{all} || $Options{$FlagOptionNameFor{$InfoKey}}) ? 1 : 0;
  }

  # List bit density as well during listing of average bit density...
  $OptionsInfo{ListBitDensity} = 1 if $OptionsInfo{ListAverageBitDensity};

  # By default, count number of rows containing fingerprints data...
  $OptionsInfo{CountFingerprints} = 1;

  # Values copied as specified...
  $OptionsInfo{ColMode} = $Options{colmode};
  $OptionsInfo{DetailLevel} = $Options{detail};
  $OptionsInfo{InDelim} = $Options{indelim};

  # Fingerprints column: explicit value or auto detection...
  if (IsNotEmpty($Options{fingerprintscol})) {
    if ($Options{colmode} =~ /^ColNum$/i && !IsPositiveInteger($Options{fingerprintscol})) {
      die "Error: Column value, $Options{fingerprintscol}, specified using \"--FingerprintsCol\" is not valid: Allowed integer values: > 0.\n";
    }
    $OptionsInfo{FingerprintsCol} = $Options{fingerprintscol};
  }
  else {
    $OptionsInfo{FingerprintsCol} = 'AutoDetect';
  }

  # Fingerprints field label: explicit value or auto detection...
  $OptionsInfo{FingerprintsFieldLabel} = IsNotEmpty($Options{fingerprintsfield}) ? $Options{fingerprintsfield} : 'AutoDetect';

  # Any one of these flags turns on listing of fingerprints data entry information...
  @DataEntryInfoKeys = qw(ListFingerprintsType ListFingerprintsDescription ListFingerprintsSize ListFingerprintsBitStringFormat ListFingerprintsBitOrder ListFingerprintsVectorValuesType ListFingerprintsVectorValuesFormat ListBitDensity ListAverageBitDensity ListNumOfOnBits ListNumOfNonZeroValues);
  $OptionsInfo{ListFingerprintsDataEntryInfo} = (grep { $OptionsInfo{$_} } @DataEntryInfoKeys) ? 1 : 0;
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
473
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
# Setup script usage and retrieve command line arguments specified using various options...
#
# Takes no arguments. Resets the file-level %Options to its default values,
# parses the command line using GetOptions, switches to the working directory
# when one is specified, and dies for an invalid value of ColMode, detail or
# InDelim option.
#
sub SetupScriptUsage {
  my(@OptionSpecs);

  # Default values which stay in place unless specified on the command line...
  %Options = ('colmode' => 'colnum', 'detail' => 1, 'indelim' => 'comma');

  # Retrieve all the options...
  @OptionSpecs = ("all|a", "averagebitdensity", "bitdensity", "count", "colmode|c=s", "detail|d=i", "datacheck", "empty|e", "fingerprintsfield=s", "fingerprintscol=s", "fingerprintstype", "fingerprintsdescription", "fingerprintssize", "fingerprintsbitstringformat", "fingerprintsbitorder", "fingerprintsvectorvaluestype", "fingerprintsvectorvaluesformat", "help|h", "indelim=s", "numofonbits", "numofnonzerovalues", "workingdir|w=s");
  GetOptions(\%Options, @OptionSpecs)
    or die "\nTo get a list of valid options and their values, use \"$ScriptName -h\" or\n\"perl -S $ScriptName -h\" command and try again...\n";

  # Switch to the working directory before any input file gets processed...
  if ($Options{workingdir}) {
    -d $Options{workingdir}
      or die "Error: The value specified, $Options{workingdir}, for option \"-w --workingdir\" is not a directory name.\n";
    chdir $Options{workingdir} or die "Error: Couldn't chdir $Options{workingdir}: $! \n";
  }

  # Validate option values...
  unless ($Options{colmode} =~ /^(ColNum|ColLabel)$/i) {
    die "Error: The value specified, $Options{colmode}, for option \"-c, --ColMode\" is not valid. Allowed values: ColNum, or ColLabel\n";
  }
  unless (IsPositiveInteger($Options{detail})) {
    die "Error: The value specified, $Options{detail}, for option \"-d, --detail\" is not valid. Allowed values: > 0 \n";
  }
  unless ($Options{indelim} =~ /^(comma|semicolon)$/i) {
    die "Error: The value specified, $Options{indelim}, for option \"--InDelim\" is not valid. Allowed values: comma, or semicolon\n";
  }
}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
503
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
504 __END__
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
505
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
506 =head1 NAME
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
507
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
508 InfoFingerprintsFiles.pl - List information about fingerprints data in SD, FP and CSV/TSV text file(s)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
509
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
510 =head1 SYNOPSIS
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
511
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
512 InfoFingerprintsFiles.pl SDFile(s) FPFile(s) TextFile(s)...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
513
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
514 InfoFingerprintsFiles.pl [B<-a, --all>] [B<--AverageBitDensity>] [B<--BitDensity>]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
515 [B<--count>] [B<-c, --ColMode> I<ColNum | ColLabel>] [B<--DataCheck>]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
516 [B<-d, --detail> I<InfoLevel>] [B<-e, --empty>] [B<--FingerprintsCol> I<col number | col name>]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
517 [B<--FingerprintsField> I<FieldLabel>] [B<--FingerprintsType>] [B<--FingerprintsDescription>]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
518 [B<--FingerprintsSize>] [B<--FingerprintsBitStringFormat>] [B<--FingerprintsBitOrder>]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
519 [B<--FingerprintsVectorValuesType>] [B<--FingerprintsVectorValuesFormat>]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
520 [B<-h, --help>] [B<--InDelim> I<comma | semicolon>]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
521 [B<--NumOfOnBits>] [B<--NumOfNonZeroValues>]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
522 [B<-w, --WorkingDir> dirname] SDFile(s) FPFile(s) TextFile(s)...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
523
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
524 =head1 DESCRIPTION
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
525
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
526 List information about fingerprints data in I<SD, FP and CSV/TSV> text file(s): number of
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
527 rows containing fingerprints data, type of fingerprints vector, description and size of fingerprints,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
528 bit density and average bit density for bit-vector fingerprints strings, and so on.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
529
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
530 The scripts InfoFingerprintsSDFiles.pl and InfoFingerprintsTextFiles.pl have been removed from the
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
531 current release of MayaChemTools and their functionality merged with this script.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
532
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
533 The valid I<SDFile> extensions are I<.sdf> and I<.sd>. All SD files in the current directory
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
534 can be specified either by I<*.sdf> or the current directory name.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
535
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
536 The valid I<FPFile> extensions are I<.fpf> and I<.fp>. All FP files in the current directory
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
537 can be specified either by I<*.fpf> or the current directory name.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
538
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
539 The valid I<TextFile> extensions are I<.csv> and I<.tsv> for comma/semicolon and tab
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
540 delimited text files respectively. All other file names are ignored. All text files in the
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
541 current directory can be specified by I<*.csv>, I<*.tsv>, or the current directory
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
542 name. The B<--indelim> option determines the format of I<TextFile(s)>. Any file
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
543 which doesn't correspond to the format indicated by B<--indelim> option is ignored.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
544
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
545 Format of fingerprint strings data in I<SDFile(s), FPFile(s) and TextFile(s)> is automatically
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
546 detected.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
547
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
548 Example of I<FP> file containing fingerprints bit-vector string data:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
549
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
550 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
551 # Package = MayaChemTools 7.4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
552 # ReleaseDate = Oct 21, 2010
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
553 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
554 # TimeStamp = Mon Mar 7 15:14:01 2011
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
555 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
556 # FingerprintsStringType = FingerprintsBitVector
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
557 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
558 # Description = PathLengthBits:AtomicInvariantsAtomTypes:MinLength1:...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
559 # Size = 1024
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
560 # BitStringFormat = HexadecimalString
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
561 # BitsOrder = Ascending
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
562 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
563 Cmpd1 9c8460989ec8a49913991a6603130b0a19e8051c89184414953800cc21510...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
564 Cmpd2 000000249400840040100042011001001980410c000000001010088001120...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
565 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
566 ... ..
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
567
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
568 Example of I<FP> file containing fingerprints vector string data:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
569
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
570 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
571 # Package = MayaChemTools 7.4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
572 # ReleaseDate = Oct 21, 2010
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
573 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
574 # TimeStamp = Mon Mar 7 15:14:01 2011
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
575 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
576 # FingerprintsStringType = FingerprintsVector
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
577 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
578 # Description = PathLengthBits:AtomicInvariantsAtomTypes:MinLength1:...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
579 # VectorStringFormat = IDsAndValuesString
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
580 # VectorValuesType = NumericalValues
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
581 #
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
582 Cmpd1 338;C F N O C:C C:N C=O CC CF CN CO C:C:C C:C:N C:CC C:CF C:CN C:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
583 N:C C:NC CC:N CC=O CCC CCN CCO CNC NC=O O=CO C:C:C:C C:C:C:N C:C:CC...;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
584 33 1 2 5 21 2 2 12 1 3 3 20 2 10 2 2 1 2 2 2 8 2 5 1 1 1 19 2 8 2 2 2 2
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
585 6 2 2 2 2 2 2 2 2 3 2 2 1 4 1 5 1 1 18 6 2 2 1 2 10 2 1 2 1 2 2 2 2 ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
586 Cmpd2 103;C N O C=N C=O CC CN CO CC=O CCC CCN CCO CNC N=CN NC=O NCN O=C
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
587 O C CC=O CCCC CCCN CCCO CCNC CNC=N CNC=O CNCN CCCC=O CCCCC CCCCN CC...;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
588 15 4 4 1 2 13 5 2 2 15 5 3 2 2 1 1 1 2 17 7 6 5 1 1 1 2 15 8 5 7 2 2 2 2
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
589 1 2 1 1 3 15 7 6 8 3 4 4 3 2 2 1 2 3 14 2 4 7 4 4 4 4 1 1 1 2 1 1 1 ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
590 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
591 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
592
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
593 Example of I<SD> file containing fingerprints bit-vector string data:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
594
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
595 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
596 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
597 $$$$
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
598 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
599 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
600 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
601 41 44 0 0 0 0 0 0 0 0999 V2000
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
602 -3.3652 1.4499 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
603 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
604 2 3 1 0 0 0 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
605 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
606 M END
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
607 > <CmpdID>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
608 Cmpd1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
609
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
610 > <PathLengthFingerprints>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
611 FingerprintsBitVector;PathLengthBits:AtomicInvariantsAtomTypes:MinLengt
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
612 h1:MaxLength8;1024;HexadecimalString;Ascending;9c8460989ec8a49913991a66
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
613 03130b0a19e8051c89184414953800cc2151082844a201042800130860308e8204d4028
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
614 00831048940e44281c00060449a5000ac80c894114e006321264401600846c050164462
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
615 08190410805000304a10205b0100e04c0038ba0fad0209c0ca8b1200012268b61c0026a
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
616 aa0660a11014a011d46
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
617
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
618 $$$$
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
619 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
620 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
621
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
622 Example of CSV I<Text> file containing fingerprints bit-vector string data:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
623
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
624 "CompoundID","PathLengthFingerprints"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
625 "Cmpd1","FingerprintsBitVector;PathLengthBits:AtomicInvariantsAtomTypes
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
626 :MinLength1:MaxLength8;1024;HexadecimalString;Ascending;9c8460989ec8a4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
627 9913991a6603130b0a19e8051c89184414953800cc2151082844a20104280013086030
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
628 8e8204d402800831048940e44281c00060449a5000ac80c894114e006321264401..."
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
629 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
630 ... ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
631
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
632 The current release of MayaChemTools supports the following types of fingerprint
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
633 bit-vector and vector strings:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
634
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
635 FingerprintsVector;AtomNeighborhoods:AtomicInvariantsAtomTypes:MinRadi
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
636 us0:MaxRadius2;41;AlphaNumericalValues;ValuesString;NR0-C.X1.BO1.H3-AT
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
637 C1:NR1-C.X3.BO3.H1-ATC1:NR2-C.X1.BO1.H3-ATC1:NR2-C.X3.BO4-ATC1 NR0-C.X
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
638 1.BO1.H3-ATC1:NR1-C.X3.BO3.H1-ATC1:NR2-C.X1.BO1.H3-ATC1:NR2-C.X3.BO4-A
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
639 TC1 NR0-C.X2.BO2.H2-ATC1:NR1-C.X2.BO2.H2-ATC1:NR1-C.X3.BO3.H1-ATC1:NR2
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
640 -C.X2.BO2.H2-ATC1:NR2-N.X3.BO3-ATC1:NR2-O.X1.BO1.H1-ATC1 NR0-C.X2.B...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
641
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
642 FingerprintsVector;AtomTypesCount:AtomicInvariantsAtomTypes:ArbitraryS
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
643 ize;10;NumericalValues;IDsAndValuesString;C.X1.BO1.H3 C.X2.BO2.H2 C.X2
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
644 .BO3.H1 C.X3.BO3.H1 C.X3.BO4 F.X1.BO1 N.X2.BO2.H1 N.X3.BO3 O.X1.BO1.H1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
645 O.X1.BO2;2 4 14 3 10 1 1 1 3 2
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
646
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
647 FingerprintsVector;AtomTypesCount:SLogPAtomTypes:ArbitrarySize;16;Nume
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
648 ricalValues;IDsAndValuesString;C1 C10 C11 C14 C18 C20 C21 C22 C5 CS F
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
649 N11 N4 O10 O2 O9;5 1 1 1 14 4 2 1 2 2 1 1 1 1 3 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
650
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
651 FingerprintsVector;AtomTypesCount:SLogPAtomTypes:FixedSize;67;OrderedN
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
652 umericalValues;IDsAndValuesString;C1 C2 C3 C4 C5 C6 C7 C8 C9 C10 C11 C
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
653 12 C13 C14 C15 C16 C17 C18 C19 C20 C21 C22 C23 C24 C25 C26 C27 CS N1 N
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
654 2 N3 N4 N5 N6 N7 N8 N9 N10 N11 N12 N13 N14 NS O1 O2 O3 O4 O5 O6 O7 O8
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
655 O9 O10 O11 O12 OS F Cl Br I Hal P S1 S2 S3 Me1 Me2;5 0 0 0 2 0 0 0 0 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
656 1 0 0 1 0 0 0 14 0 4 2 1 0 0 0 0 0 2 0 0 0 1 0 0 0 0 0 0 1 0 0 0 0...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
657
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
658 FingerprintsVector;EStateIndicies:ArbitrarySize;11;NumericalValues;IDs
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
659 AndValuesString;SaaCH SaasC SaasN SdO SdssC SsCH3 SsF SsOH SssCH2 SssN
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
660 H SsssCH;24.778 4.387 1.993 25.023 -1.435 3.975 14.006 29.759 -0.073 3
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
661 .024 -2.270
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
662
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
663 FingerprintsVector;EStateIndicies:FixedSize;87;OrderedNumericalValues;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
664 ValuesString;0 0 0 0 0 0 0 3.975 0 -0.073 0 0 24.778 -2.270 0 0 -1.435
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
665 4.387 0 0 0 0 0 0 3.024 0 0 0 0 0 0 0 1.993 0 29.759 25.023 0 0 0 0 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
666 4.006 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
667 0 0 0 0 0 0 0 0 0 0 0 0 0 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
668
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
669 FingerprintsVector;ExtendedConnectivity:AtomicInvariantsAtomTypes:Radi
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
670 us2;60;AlphaNumericalValues;ValuesString;73555770 333564680 352413391
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
671 666191900 1001270906 1371674323 1481469939 1977749791 2006158649 21414
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
672 08799 49532520 64643108 79385615 96062769 273726379 564565671 85514103
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
673 5 906706094 988546669 1018231313 1032696425 1197507444 1331250018 1338
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
674 532734 1455473691 1607485225 1609687129 1631614296 1670251330 17303...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
675
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
676 FingerprintsVector;ExtendedConnectivityCount:AtomicInvariantsAtomTypes
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
677 :Radius2;60;NumericalValues;IDsAndValuesString;73555770 333564680 3524
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
678 13391 666191900 1001270906 1371674323 1481469939 1977749791 2006158649
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
679 2141408799 49532520 64643108 79385615 96062769 273726379 564565671...;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
680 3 2 1 1 14 1 2 10 4 3 1 1 1 1 2 1 2 1 1 1 2 3 1 1 2 1 3 3 8 2 2 2 6 2
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
681 1 2 1 1 2 1 1 1 2 1 1 2 1 2 1 1 1 1 1 1 1 1 1 2 1 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
682
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
683 FingerprintsBitVector;ExtendedConnectivityBits:AtomicInvariantsAtomTyp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
684 es:Radius2;1024;BinaryString;Ascending;0000000000000000000000000000100
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
685 0000000001010000000110000011000000000000100000000000000000000000100001
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
686 1000000110000000000000000000000000010011000000000000000000000000010000
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
687 0000000000000000000000000010000000000000000001000000000000000000000000
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
688 0000000000010000100001000000000000101000000000000000100000000000000...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
689
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
690 FingerprintsVector;ExtendedConnectivity:FunctionalClassAtomTypes:Radiu
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
691 s2;57;AlphaNumericalValues;ValuesString;24769214 508787397 850393286 8
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
692 62102353 981185303 1231636850 1649386610 1941540674 263599683 32920567
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
693 1 571109041 639579325 683993318 723853089 810600886 885767127 90326012
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
694 7 958841485 981022393 1126908698 1152248391 1317567065 1421489994 1455
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
695 632544 1557272891 1826413669 1983319256 2015750777 2029559552 20404...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
696
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
697 FingerprintsVector;ExtendedConnectivity:EStateAtomTypes:Radius2;62;Alp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
698 haNumericalValues;ValuesString;25189973 528584866 662581668 671034184
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
699 926543080 1347067490 1738510057 1759600920 2034425745 2097234755 21450
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
700 44754 96779665 180364292 341712110 345278822 386540408 387387308 50430
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
701 1706 617094135 771528807 957666640 997798220 1158349170 1291258082 134
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
702 1138533 1395329837 1420277211 1479584608 1486476397 1487556246 1566...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
703
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
704 FingerprintsBitVector;MACCSKeyBits;166;BinaryString;Ascending;00000000
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
705 0000000000000000000000000000000001001000010010000000010010000000011100
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
706 0100101010111100011011000100110110000011011110100110111111111111011111
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
707 11111111111110111000
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
708
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
709 FingerprintsBitVector;MACCSKeyBits;322;BinaryString;Ascending;11101011
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
710 1110011111100101111111000111101100110000000000000011100010000000000000
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
711 0000000000000000000000000000000000000000000000101000000000000000000000
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
712 0000000000000000000000000000000000000000000000000000000000000000000000
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
713 0000000000000000000000000000000000000011000000000000000000000000000000
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
714 0000000000000000000000000000000000000000
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
715
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
716 FingerprintsVector;MACCSKeyCount;166;OrderedNumericalValues;ValuesStri
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
717 ng;0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
718 0 0 0 0 0 0 0 1 0 0 3 0 0 0 0 4 0 0 2 0 0 0 0 0 0 0 0 2 0 0 2 0 0 0 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
719 0 0 0 0 1 1 8 0 0 0 1 0 0 1 0 1 0 1 0 3 1 3 1 0 0 0 1 2 0 11 1 0 0 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
720 5 0 0 1 2 0 1 1 0 0 0 0 0 1 1 0 1 1 1 1 0 4 0 0 1 1 0 4 6 1 1 1 2 1 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
721 3 5 2 2 0 5 3 5 1 1 2 5 1 2 1 2 4 8 3 5 5 2 2 0 3 5 4 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
722
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
723 FingerprintsVector;MACCSKeyCount;322;OrderedNumericalValues;ValuesStri
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
724 ng;14 8 2 0 2 0 4 4 2 1 4 0 0 2 5 10 5 2 1 0 0 2 0 5 13 3 28 5 5 3 0 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
725 0 4 2 1 1 0 1 1 0 0 2 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 22 5 3 0 0 0 1 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
726 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
727 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 11 0 2 0 0 0 0 0 0 0 0 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
728 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
729
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
730 FingerprintsBitVector;PathLengthBits:AtomicInvariantsAtomTypes:MinLeng
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
731 th1:MaxLength8;1024;BinaryString;Ascending;001000010011010101011000110
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
732 0100010101011000101001011100110001000010001001101000001001001001001000
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
733 0010110100000111001001000001001010100100100000000011000000101001011100
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
734 0010000001000101010100000100111100110111011011011000000010110111001101
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
735 0101100011000000010001000011000010100011101100001000001000100000000...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
736
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
737 FingerprintsVector;PathLengthCount:AtomicInvariantsAtomTypes:MinLength
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
738 1:MaxLength8;432;NumericalValues;IDsAndValuesPairsString;C.X1.BO1.H3 2
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
739 C.X2.BO2.H2 4 C.X2.BO3.H1 14 C.X3.BO3.H1 3 C.X3.BO4 10 F.X1.BO1 1 N.X
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
740 2.BO2.H1 1 N.X3.BO3 1 O.X1.BO1.H1 3 O.X1.BO2 2 C.X1.BO1.H3C.X3.BO3.H1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
741 2 C.X2.BO2.H2C.X2.BO2.H2 1 C.X2.BO2.H2C.X3.BO3.H1 4 C.X2.BO2.H2C.X3.BO
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
742 4 1 C.X2.BO2.H2N.X3.BO3 1 C.X2.BO3.H1:C.X2.BO3.H1 10 C.X2.BO3.H1:C....
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
743
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
744 FingerprintsVector;PathLengthCount:MMFF94AtomTypes:MinLength1:MaxLengt
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
745 h8;463;NumericalValues;IDsAndValuesPairsString;C5A 2 C5B 2 C=ON 1 CB 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
746 8 COO 1 CR 9 F 1 N5 1 NC=O 1 O=CN 1 O=CO 1 OC=O 1 OR 2 C5A:C5B 2 C5A:N
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
747 5 2 C5ACB 1 C5ACR 1 C5B:C5B 1 C5BC=ON 1 C5BCB 1 C=ON=O=CN 1 C=ONNC=O 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
748 CB:CB 18 CBF 1 CBNC=O 1 COO=O=CO 1 COOCR 1 COOOC=O 1 CRCR 7 CRN5 1 CR
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
749 OR 2 C5A:C5B:C5B 2 C5A:C5BC=ON 1 C5A:C5BCB 1 C5A:N5:C5A 1 C5A:N5CR ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
750
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
751 FingerprintsVector;TopologicalAtomPairs:AtomicInvariantsAtomTypes:MinD
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
752 istance1:MaxDistance10;223;NumericalValues;IDsAndValuesString;C.X1.BO1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
753 .H3-D1-C.X3.BO3.H1 C.X2.BO2.H2-D1-C.X2.BO2.H2 C.X2.BO2.H2-D1-C.X3.BO3.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
754 H1 C.X2.BO2.H2-D1-C.X3.BO4 C.X2.BO2.H2-D1-N.X3.BO3 C.X2.BO3.H1-D1-...;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
755 2 1 4 1 1 10 8 1 2 6 1 2 2 1 2 1 2 2 1 2 1 5 1 10 12 2 2 1 2 1 9 1 3 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
756 1 1 2 2 1 3 6 1 6 14 2 2 2 3 1 3 1 8 2 2 1 3 2 6 1 2 2 5 1 3 1 23 1...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
757
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
758 FingerprintsVector;TopologicalAtomPairs:FunctionalClassAtomTypes:MinDi
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
759 stance1:MaxDistance10;144;NumericalValues;IDsAndValuesString;Ar-D1-Ar
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
760 Ar-D1-Ar.HBA Ar-D1-HBD Ar-D1-Hal Ar-D1-None Ar.HBA-D1-None HBA-D1-NI H
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
761 BA-D1-None HBA.HBD-D1-NI HBA.HBD-D1-None HBD-D1-None NI-D1-None No...;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
762 23 2 1 1 2 1 1 1 1 2 1 1 7 28 3 1 3 2 8 2 1 1 1 5 1 5 24 3 3 4 2 13 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
763 1 1 4 1 5 22 4 4 3 1 19 1 1 1 1 1 2 2 3 1 1 8 25 4 5 2 3 1 26 1 4 1 ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
764
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
765 FingerprintsVector;TopologicalAtomTorsions:AtomicInvariantsAtomTypes;3
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
766 3;NumericalValues;IDsAndValuesString;C.X1.BO1.H3-C.X3.BO3.H1-C.X3.BO4-
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
767 C.X3.BO4 C.X1.BO1.H3-C.X3.BO3.H1-C.X3.BO4-N.X3.BO3 C.X2.BO2.H2-C.X2.BO
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
768 2.H2-C.X3.BO3.H1-C.X2.BO2.H2 C.X2.BO2.H2-C.X2.BO2.H2-C.X3.BO3.H1-O...;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
769 2 2 1 1 2 2 1 1 3 4 4 8 4 2 2 6 2 2 1 2 1 1 2 1 1 2 6 2 4 2 1 3 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
770
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
771 FingerprintsVector;TopologicalAtomTorsions:EStateAtomTypes;36;Numerica
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
772 lValues;IDsAndValuesString;aaCH-aaCH-aaCH-aaCH aaCH-aaCH-aaCH-aasC aaC
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
773 H-aaCH-aasC-aaCH aaCH-aaCH-aasC-aasC aaCH-aaCH-aasC-sF aaCH-aaCH-aasC-
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
774 ssNH aaCH-aasC-aasC-aasC aaCH-aasC-aasC-aasN aaCH-aasC-ssNH-dssC a...;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
775 4 4 8 4 2 2 6 2 2 2 4 3 2 1 3 3 2 2 2 1 2 1 1 1 2 1 1 1 1 1 1 1 2 1 1 2
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
776
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
777 FingerprintsVector;TopologicalAtomTriplets:AtomicInvariantsAtomTypes:M
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
778 inDistance1:MaxDistance10;3096;NumericalValues;IDsAndValuesString;C.X1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
779 .BO1.H3-D1-C.X1.BO1.H3-D1-C.X3.BO3.H1-D2 C.X1.BO1.H3-D1-C.X2.BO2.H2-D1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
780 0-C.X3.BO4-D9 C.X1.BO1.H3-D1-C.X2.BO2.H2-D3-N.X3.BO3-D4 C.X1.BO1.H3-D1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
781 -C.X2.BO2.H2-D4-C.X2.BO2.H2-D5 C.X1.BO1.H3-D1-C.X2.BO2.H2-D6-C.X3....;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
782 1 2 2 2 2 2 2 2 8 8 4 8 4 4 2 2 2 2 4 2 2 2 4 2 2 2 2 1 2 2 4 4 4 2 2
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
783 2 4 4 4 8 4 4 2 4 4 4 2 4 4 2 2 2 2 2 2 2 2 1 2 2 2 2 2 2 2 2 2 2 8...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
784
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
785 FingerprintsVector;TopologicalAtomTriplets:SYBYLAtomTypes:MinDistance1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
786 :MaxDistance10;2332;NumericalValues;IDsAndValuesString;C.2-D1-C.2-D9-C
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
787 .3-D10 C.2-D1-C.2-D9-C.ar-D10 C.2-D1-C.3-D1-C.3-D2 C.2-D1-C.3-D10-C.3-
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
788 D9 C.2-D1-C.3-D2-C.3-D3 C.2-D1-C.3-D2-C.ar-D3 C.2-D1-C.3-D3-C.3-D4 C.2
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
789 -D1-C.3-D3-N.ar-D4 C.2-D1-C.3-D3-O.3-D2 C.2-D1-C.3-D4-C.3-D5 C.2-D1-C.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
790 3-D5-C.3-D6 C.2-D1-C.3-D5-O.3-D4 C.2-D1-C.3-D6-C.3-D7 C.2-D1-C.3-D7...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
791
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
792 FingerprintsVector;TopologicalPharmacophoreAtomPairs:ArbitrarySize:Min
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
793 Distance1:MaxDistance10;54;NumericalValues;IDsAndValuesString;H-D1-H H
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
794 -D1-NI HBA-D1-NI HBD-D1-NI H-D2-H H-D2-HBA H-D2-HBD HBA-D2-HBA HBA-D2-
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
795 HBD H-D3-H H-D3-HBA H-D3-HBD H-D3-NI HBA-D3-NI HBD-D3-NI H-D4-H H-D4-H
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
796 BA H-D4-HBD HBA-D4-HBA HBA-D4-HBD HBD-D4-HBD H-D5-H H-D5-HBA H-D5-...;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
797 18 1 2 1 22 12 8 1 2 18 6 3 1 1 1 22 13 6 5 7 2 28 9 5 1 1 1 36 16 10
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
798 3 4 1 37 10 8 1 35 10 9 3 3 1 28 7 7 4 18 16 12 5 1 2 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
799
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
800 FingerprintsVector;TopologicalPharmacophoreAtomPairs:FixedSize:MinDist
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
801 ance1:MaxDistance10;150;OrderedNumericalValues;ValuesString;18 0 0 1 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
802 0 0 2 0 0 1 0 0 0 0 22 12 8 0 0 1 2 0 0 0 0 0 0 0 0 18 6 3 1 0 0 0 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
803 0 0 1 0 0 0 0 22 13 6 0 0 5 7 0 0 2 0 0 0 0 0 28 9 5 1 0 0 0 1 0 0 1 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
804 0 0 0 36 16 10 0 0 3 4 0 0 1 0 0 0 0 0 37 10 8 0 0 0 0 1 0 0 0 0 0 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
805 0 35 10 9 0 0 3 3 0 0 1 0 0 0 0 0 28 7 7 4 0 0 0 0 0 0 0 0 0 0 0 18...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
806
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
807 FingerprintsVector;TopologicalPharmacophoreAtomTriplets:ArbitrarySize:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
808 MinDistance1:MaxDistance10;696;NumericalValues;IDsAndValuesString;Ar1-
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
809 Ar1-Ar1 Ar1-Ar1-H1 Ar1-Ar1-HBA1 Ar1-Ar1-HBD1 Ar1-H1-H1 Ar1-H1-HBA1 Ar1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
810 -H1-HBD1 Ar1-HBA1-HBD1 H1-H1-H1 H1-H1-HBA1 H1-H1-HBD1 H1-HBA1-HBA1 H1-
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
811 HBA1-HBD1 H1-HBA1-NI1 H1-HBD1-NI1 HBA1-HBA1-NI1 HBA1-HBD1-NI1 Ar1-...;
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
812 46 106 8 3 83 11 4 1 21 5 3 1 2 2 1 1 1 100 101 18 11 145 132 26 14 23
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
813 28 3 3 5 4 61 45 10 4 16 20 7 5 1 3 4 5 3 1 1 1 1 5 4 2 1 2 2 2 1 1 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
814 119 123 24 15 185 202 41 25 22 17 3 5 85 95 18 11 23 17 3 1 1 6 4 ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
815
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
816 FingerprintsVector;TopologicalPharmacophoreAtomTriplets:FixedSize:MinD
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
817 istance1:MaxDistance10;2692;OrderedNumericalValues;ValuesString;46 106
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
818 8 3 0 0 83 11 4 0 0 0 1 0 0 0 0 0 0 0 0 21 5 3 0 0 1 2 2 0 0 1 0 0 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
819 0 0 0 1 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 100 101 18 11 0 0 145 132 26
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
820 14 0 0 23 28 3 3 0 0 5 4 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 61 45 10 4 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
821 0 16 20 7 5 1 0 3 4 5 3 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 1 1 0 0 5 ...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
822
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
823 =head1 OPTIONS
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
824
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
825 =over 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
826
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
827 =item B<-a, --all>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
828
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
829 List all the available information.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
830
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
831 =item B<--AverageBitDensity>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
832
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
833 List average bit density of fingerprint bit-vector strings.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
834
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
835 =item B<--BitDensity>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
836
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
837 List bit density of fingerprints bit-vector strings data in each row.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
838
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
839 =item B<--count>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
840
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
841 List number of data entries containing fingerprints bit-vector or vector strings data. This
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
842 is B<default behavior>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
843
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
844 =item B<-c, --ColMode> I<ColNum | ColLabel>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
845
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
846 Specify how columns are identified in CSV/TSV I<TextFile(s)>: using column number or column
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
847 label. Possible values: I<ColNum or ColLabel>. Default value: I<ColNum>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
848
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
849 =item B<-d, --detail> I<InfoLevel>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
850
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
851 Level of information to print about lines being ignored. Default: I<1>. Possible values:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
852 I<1, 2 or 3>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
853
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
854 =item B<--DataCheck>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
855
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
856 Validate fingerprints data specified using B<--FingerprintsCol> and list information
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
857 about missing and invalid data.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
858
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
859 =item B<-e, --empty>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
860
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
861 List number of rows containing no fingerprints data.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
862
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
863 =item B<--FingerprintsCol> I<col number | col label>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
864
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
865 This value is B<-c, --ColMode> specific. It corresponds to the column in CSV/TSV I<TextFile(s)>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
866 containing fingerprints data. Possible values: I<col number or col label>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
867 Default value: I<first column containing the word Fingerprints in its column label>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
868
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
869 =item B<--FingerprintsField> I<FieldLabel>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
870
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
871 Fingerprints field label to use during listing of fingerprints information for I<SDFile(s)>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
872 Default value: I<first data field label containing the word Fingerprints in its label>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
873
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
874 =item B<--FingerprintsType>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
875
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
876 List types of fingerprint strings: FingerprintsBitVector or FingerprintsVector.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
877
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
878 =item B<--FingerprintsDescription>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
879
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
880 List types of fingerprints: PathLengthBits, PathLengthCount, MACCSKeyCount,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
881 ExtendedConnectivity and so on.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
882
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
883 =item B<--FingerprintsSize>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
884
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
885 List size of fingerprints.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
886
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
887 =item B<--FingerprintsBitStringFormat>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
888
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
889 List format of fingerprint bit-vector strings: BinaryString or HexadecimalString.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
890
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
891 =item B<--FingerprintsBitOrder>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
892
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
893 List order of bits in fingerprint bit-vector strings: Ascending or Descending.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
894
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
895 =item B<--FingerprintsVectorValuesType>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
896
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
897 List type of values in fingerprint vector strings: OrderedNumericalValues, NumericalValues or
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
898 AlphaNumericalValues.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
899
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
900 =item B<--FingerprintsVectorValuesFormat>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
901
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
902 List format of values in fingerprint vector strings: ValuesString, IDsAndValuesString,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
903 IDsAndValuesPairsString, ValuesAndIDsString or ValuesAndIDsPairsString.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
904
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
905 =item B<-h, --help>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
906
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
907 Print this help message.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
908
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
909 =item B<--InDelim> I<comma | semicolon>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
910
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
911 Input delimiter for CSV I<TextFile(s)>. Possible values: I<comma or semicolon>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
912 Default value: I<comma>. For TSV files, this option is ignored and I<tab> is used as a
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
913 delimiter.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
914
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
915 =item B<--NumOfOnBits>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
916
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
917 List number of on bits in fingerprints bit-vector strings data in each row.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
918
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
919 =item B<--NumOfNonZeroValues>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
920
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
921 List number of non-zero values in fingerprints vector strings data in each row.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
922
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
923 =item B<-w, --WorkingDir> I<DirName>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
924
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
925 Location of working directory. Default: current directory.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
926
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
927 =back
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
928
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
929 =head1 EXAMPLES
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
930
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
931 To count number of lines containing fingerprints bit-vector or vector strings data present
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
932 in FP file, in a column name containing Fingerprint substring in text file, and in a data
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
933 field with Fingerprint substring in its label, type:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
934
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
935 % InfoFingerprintsFiles.pl SampleFPBin.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
936
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
937 % InfoFingerprintsFiles.pl SampleFPBin.sdf SampleFPBin.fpf
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
938 SampleFPBin.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
939
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
940 % InfoFingerprintsFiles.pl SampleFPHex.sdf SampleFPHex.fpf
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
941 SampleFPHex.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
942
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
943 % InfoFingerprintsFiles.pl SampleFPcount.sdf SampleFPcount.fpf
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
944 SampleFPcount.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
945
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
946 To list all available information about fingerprints bit-vector or vector strings data present
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
947 in FP file, in a column name containing Fingerprint substring in text file, and in a data
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
948 field with Fingerprint substring in its label, type:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
949
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
950 % InfoFingerprintsFiles.pl -a SampleFPHex.sdf SampleFPHex.fpf
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
951 SampleFPHex.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
952
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
953 % InfoFingerprintsFiles.pl -a SampleFPcount.sdf SampleFPcount.fpf
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
954 SampleFPcount.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
955
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
956 To list all available information about fingerprints bit-vector or vector strings data present in a
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
957 column named Fingerprints in text file, type:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
958
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
959 % InfoFingerprintsFiles.pl -a --ColMode ColLabel --FingerprintsCol
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
960 Fingerprints SampleFPHex.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
961
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
962 % InfoFingerprintsFiles.pl -a --ColMode ColLabel --FingerprintsCol
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
963 Fingerprints SampleFPcount.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
964
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
965 To list all available information about fingerprints bit-vector or vector strings data present in a
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
966 data field named Fingerprints in SD file, type:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
967
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
968 % InfoFingerprintsFiles.pl -a --FingerprintsField Fingerprints
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
969 SampleFPHex.sdf
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
970
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
971 % InfoFingerprintsFiles.pl -a --FingerprintsField Fingerprints
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
972 SampleFPcount.sdf
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
973
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
974 To list bit density, average bit density, and number of on bits for fingerprints bit-vector strings data
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
975 present in FP file, in a column name containing Fingerprint substring in text file, and in a data
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
976 field with Fingerprint substring in its label, type:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
977
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
978 % InfoFingerprintsFiles.pl --BitDensity --AverageBitDensity
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
979 --NumOfOnBits SampleFPBin.csv SampleFPBin.sdf SampleFPBin.fpf
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
980
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
981 To list vector values type, format and number of non-zero values for fingerprints vector strings
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
982 data present in FP file, in a column name containing Fingerprint substring in text file, and in a data
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
983 field with Fingerprint substring in its label along with fingerprints type and description, type:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
984
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
985 % InfoFingerprintsFiles.pl --FingerprintsType --FingerprintsDescription
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
986 --FingerprintsVectorValuesType --FingerprintsVectorValuesFormat
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
987 --NumOfNonZeroValues SampleFPcount.csv SampleFPcount.sdf
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
988 SampleFPcount.fpf
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
989
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
990 =head1 AUTHOR
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
991
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
992 Manish Sud <msud@san.rr.com>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
993
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
994 =head1 SEE ALSO
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
995
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
996 SimilarityMatricesFingerprints.pl, SimilaritySearchingFingerprints.pl, AtomNeighborhoodsFingerprints.pl,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
997 ExtendedConnectivityFingerprints.pl, MACCSKeysFingerprints.pl,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
998 PathLengthFingerprints.pl, TopologicalAtomPairsFingerprints.pl, TopologicalAtomTorsionsFingerprints.pl,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
999 TopologicalPharmacophoreAtomPairsFingerprints.pl, TopologicalPharmacophoreAtomTripletsFingerprints.pl
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1000
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1001 =head1 COPYRIGHT
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1002
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1003 Copyright (C) 2015 Manish Sud. All rights reserved.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1004
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1005 This file is part of MayaChemTools.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1006
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1007 MayaChemTools is free software; you can redistribute it and/or modify it under
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1008 the terms of the GNU Lesser General Public License as published by the Free
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1009 Software Foundation; either version 3 of the License, or (at your option)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1010 any later version.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1011
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1012 =cut