comparison docs/scripts/man1/EStateIndiciesFingerprints.1 @ 0:4816e4a8ae95 draft default tip

Uploaded
author deepakjadmin
date Wed, 20 Jan 2016 09:23:18 -0500
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:4816e4a8ae95
1 .\" Automatically generated by Pod::Man 2.25 (Pod::Simple 3.22)
2 .\"
3 .\" Standard preamble:
4 .\" ========================================================================
5 .de Sp \" Vertical space (when we can't use .PP)
6 .if t .sp .5v
7 .if n .sp
8 ..
9 .de Vb \" Begin verbatim text
10 .ft CW
11 .nf
12 .ne \\$1
13 ..
14 .de Ve \" End verbatim text
15 .ft R
16 .fi
17 ..
18 .\" Set up some character translations and predefined strings. \*(-- will
19 .\" give an unbreakable dash, \*(PI will give pi, \*(L" will give a left
20 .\" double quote, and \*(R" will give a right double quote. \*(C+ will
21 .\" give a nicer C++. Capital omega is used to do unbreakable dashes and
22 .\" therefore won't be available. \*(C` and \*(C' expand to `' in nroff,
23 .\" nothing in troff, for use with C<>.
24 .tr \(*W-
25 .ds C+ C\v'-.1v'\h'-1p'\s-2+\h'-1p'+\s0\v'.1v'\h'-1p'
26 .ie n \{\
27 . ds -- \(*W-
28 . ds PI pi
29 . if (\n(.H=4u)&(1m=24u) .ds -- \(*W\h'-12u'\(*W\h'-12u'-\" diablo 10 pitch
30 . if (\n(.H=4u)&(1m=20u) .ds -- \(*W\h'-12u'\(*W\h'-8u'-\" diablo 12 pitch
31 . ds L" ""
32 . ds R" ""
33 . ds C` ""
34 . ds C' ""
35 'br\}
36 .el\{\
37 . ds -- \|\(em\|
38 . ds PI \(*p
39 . ds L" ``
40 . ds R" ''
41 'br\}
42 .\"
43 .\" Escape single quotes in literal strings from groff's Unicode transform.
44 .ie \n(.g .ds Aq \(aq
45 .el .ds Aq '
46 .\"
47 .\" If the F register is turned on, we'll generate index entries on stderr for
48 .\" titles (.TH), headers (.SH), subsections (.SS), items (.Ip), and index
49 .\" entries marked with X<> in POD. Of course, you'll have to process the
50 .\" output yourself in some meaningful fashion.
51 .ie \nF \{\
52 . de IX
53 . tm Index:\\$1\t\\n%\t"\\$2"
54 ..
55 . nr % 0
56 . rr F
57 .\}
58 .el \{\
59 . de IX
60 ..
61 .\}
62 .\"
63 .\" Accent mark definitions (@(#)ms.acc 1.5 88/02/08 SMI; from UCB 4.2).
64 .\" Fear. Run. Save yourself. No user-serviceable parts.
65 . \" fudge factors for nroff and troff
66 .if n \{\
67 . ds #H 0
68 . ds #V .8m
69 . ds #F .3m
70 . ds #[ \f1
71 . ds #] \fP
72 .\}
73 .if t \{\
74 . ds #H ((1u-(\\\\n(.fu%2u))*.13m)
75 . ds #V .6m
76 . ds #F 0
77 . ds #[ \&
78 . ds #] \&
79 .\}
80 . \" simple accents for nroff and troff
81 .if n \{\
82 . ds ' \&
83 . ds ` \&
84 . ds ^ \&
85 . ds , \&
86 . ds ~ ~
87 . ds /
88 .\}
89 .if t \{\
90 . ds ' \\k:\h'-(\\n(.wu*8/10-\*(#H)'\'\h"|\\n:u"
91 . ds ` \\k:\h'-(\\n(.wu*8/10-\*(#H)'\`\h'|\\n:u'
92 . ds ^ \\k:\h'-(\\n(.wu*10/11-\*(#H)'^\h'|\\n:u'
93 . ds , \\k:\h'-(\\n(.wu*8/10)',\h'|\\n:u'
94 . ds ~ \\k:\h'-(\\n(.wu-\*(#H-.1m)'~\h'|\\n:u'
95 . ds / \\k:\h'-(\\n(.wu*8/10-\*(#H)'\z\(sl\h'|\\n:u'
96 .\}
97 . \" troff and (daisy-wheel) nroff accents
98 .ds : \\k:\h'-(\\n(.wu*8/10-\*(#H+.1m+\*(#F)'\v'-\*(#V'\z.\h'.2m+\*(#F'.\h'|\\n:u'\v'\*(#V'
99 .ds 8 \h'\*(#H'\(*b\h'-\*(#H'
100 .ds o \\k:\h'-(\\n(.wu+\w'\(de'u-\*(#H)/2u'\v'-.3n'\*(#[\z\(de\v'.3n'\h'|\\n:u'\*(#]
101 .ds d- \h'\*(#H'\(pd\h'-\w'~'u'\v'-.25m'\f2\(hy\fP\v'.25m'\h'-\*(#H'
102 .ds D- D\\k:\h'-\w'D'u'\v'-.11m'\z\(hy\v'.11m'\h'|\\n:u'
103 .ds th \*(#[\v'.3m'\s+1I\s-1\v'-.3m'\h'-(\w'I'u*2/3)'\s-1o\s+1\*(#]
104 .ds Th \*(#[\s+2I\s-2\h'-\w'I'u*3/5'\v'-.3m'o\v'.3m'\*(#]
105 .ds ae a\h'-(\w'a'u*4/10)'e
106 .ds Ae A\h'-(\w'A'u*4/10)'E
107 . \" corrections for vroff
108 .if v .ds ~ \\k:\h'-(\\n(.wu*9/10-\*(#H)'\s-2\u~\d\s+2\h'|\\n:u'
109 .if v .ds ^ \\k:\h'-(\\n(.wu*10/11-\*(#H)'\v'-.4m'^\v'.4m'\h'|\\n:u'
110 . \" for low resolution devices (crt and lpr)
111 .if \n(.H>23 .if \n(.V>19 \
112 \{\
113 . ds : e
114 . ds 8 ss
115 . ds o a
116 . ds d- d\h'-1'\(ga
117 . ds D- D\h'-1'\(hy
118 . ds th \o'bp'
119 . ds Th \o'LP'
120 . ds ae ae
121 . ds Ae AE
122 .\}
123 .rm #[ #] #H #V #F C
124 .\" ========================================================================
125 .\"
126 .IX Title "ESTATEINDICIESFINGERPRINTS 1"
127 .TH ESTATEINDICIESFINGERPRINTS 1 "2015-03-29" "perl v5.14.2" "MayaChemTools"
128 .\" For nroff, turn off justification. Always turn off hyphenation; it makes
129 .\" way too many mistakes in technical documents.
130 .if n .ad l
131 .nh
132 .SH "NAME"
133 EStateIndiciesFingerprints.pl \- Generate E\-state indicies fingerprints for SD files
134 .SH "SYNOPSIS"
135 .IX Header "SYNOPSIS"
136 EStateIndiciesFingerprints.pl SDFile(s)...
137 .PP
138 EStateIndiciesFingerprints.pl [\fB\-\-AromaticityModel\fR \fIAromaticityModelType\fR]
139 [\fB\-\-CompoundID\fR \fIDataFieldName or LabelPrefixString\fR]
140 [\fB\-\-CompoundIDLabel\fR \fItext\fR] [\fB\-\-CompoundIDMode\fR \fIDataField | MolName | LabelPrefix | MolNameOrLabelPrefix\fR]
141 [\fB\-\-DataFields\fR \fI\*(L"FieldLabel1,FieldLabel2,...\*(R"\fR] [\fB\-d, \-\-DataFieldsMode\fR \fIAll | Common | Specify | CompoundID\fR]
142 [\fB\-e, \-\-EStateAtomTypesSetToUse\fR \fIArbitrarySize or FixedSize\fR] [\fB\-f, \-\-Filter\fR \fIYes | No\fR]
143 [\fB\-\-FingerprintsLabelMode\fR \fIFingerprintsLabelOnly | FingerprintsLabelWithIDs\fR] [\fB\-\-FingerprintsLabel\fR \fItext\fR]
144 [\fB\-h, \-\-help\fR] [\fB\-k, \-\-KeepLargestComponent\fR \fIYes | No\fR]
145 [\fB\-\-OutDelim\fR \fIcomma | tab | semicolon\fR] [\fB\-\-output\fR \fI\s-1SD\s0 | \s-1FP\s0 | text | all\fR] [\fB\-o, \-\-overwrite\fR]
146 [\fB\-q, \-\-quote\fR \fIYes | No\fR] [\fB\-r, \-\-root\fR \fIRootName\fR] [\fB\-s, \-\-size\fR \fInumber\fR] [\fB\-\-ValuesPrecision\fR \fInumber\fR]
147 [\fB\-v, \-\-VectorStringFormat\fR \fIValuesString | IDsAndValuesString | IDsAndValuesPairsString | ValuesAndIDsString | ValuesAndIDsPairsString\fR]
148 [\fB\-w, \-\-WorkingDir\fR \fIDirName\fR]
149 .SH "DESCRIPTION"
150 .IX Header "DESCRIPTION"
151 Generate E\-state indicies fingerprints [ Ref 75\-78 ] for \fISDFile(s)\fR and create appropriate \s-1SD\s0,
152 \&\s-1FP\s0, or \s-1CSV/TSV\s0 text file(s) containing fingerprints bit-vector or vector strings corresponding to
153 molecular fingerprints.
154 .PP
155 Multiple SDFile names are separated by spaces. The valid file extensions are \fI.sdf\fR
156 and \fI.sd\fR. All other file names are ignored. All the \s-1SD\s0 files in a current directory
157 can be specified either by \fI*.sdf\fR or the current directory name.
158 .PP
159 E\-state atom types are assigned to all non-hydrogen atoms in a molecule using module
160 AtomTypes::EStateAtomTypes.pm and E\-state values are calculated using module
161 AtomicDescriptors::EStateValues.pm. Using E\-state atom types and E\-state values,
162 \&\fBEStateIndiciesFingerprints\fR constituting sum of E\-state values for E\-state atom types
163 is generated.
164 .PP
165 Two types of E\-state atom types set size are allowed:
166 .PP
167 .Vb 4
168 \& ArbitrarySize \- Corresponds to only E\-state atom types detected
169 \& in molecule
170 \& FixedSize \- Corresponds to fixed number of E\-state atom types previously
171 \& defined
172 .Ve
173 .PP
174 Module AtomTypes::EStateAtomTypes.pm, used to assign E\-state atom types to
175 non-hydrogen atoms in the molecule, is able to assign atom types to any valid
176 atom group. However, for \fIFixedSize\fR value of \fBEStateAtomTypesSetToUse\fR, only a
177 fixed set of E\-state atom types corresponding to specific atom groups [ Appendix \s-1III\s0 in
178 Ref 77 ] are used for fingerprints.
179 .PP
180 The fixed size E\-state atom type set size used during generation of fingerprints contains
181 87 E\-state non-hydrogen atom types in EStateAtomTypes.csv data file distributed with
182 MayaChemTools.
183 .PP
184 Combination of Type and EStateAtomTypesSetToUse allows generation of 2 different types of
185 E\-state indicies fingerprints:
186 .PP
187 .Vb 1
188 \& Type EStateAtomTypesSetToUse
189 \&
190 \& EStateIndicies ArbitrarySize [ default fingerprints ]
191 \& EStateIndicies FixedSize
192 .Ve
193 .PP
194 Example of \fI\s-1SD\s0\fR file containing E\-state indicies fingerprints string data:
195 .PP
196 .Vb 10
197 \& ... ...
198 \& ... ...
199 \& $$$$
200 \& ... ...
201 \& ... ...
202 \& ... ...
203 \& 41 44 0 0 0 0 0 0 0 0999 V2000
204 \& \-3.3652 1.4499 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
205 \& ... ...
206 \& 2 3 1 0 0 0 0
207 \& ... ...
208 \& M END
209 \& > <CmpdID>
210 \& Cmpd1
211 \&
212 \& > <EStateIndiciesFingerprints>
213 \& FingerprintsVector;EStateIndicies:ArbitrarySize;11;NumericalValues;IDsA
214 \& ndValuesString;SaaCH SaasC SaasN SdO SdssC SsCH3 SsF SsOH SssCH2 SssNH
215 \& SsssCH;24.778 4.387 1.993 25.023 \-1.435 3.975 14.006 29.759 \-0.073 3.02
216 \& 4 \-2.270
217 \&
218 \& $$$$
219 \& ... ...
220 \& ... ...
221 .Ve
222 .PP
223 Example of \fI\s-1FP\s0\fR file containing E\-state indicies fingerprints string data:
224 .PP
225 .Vb 10
226 \& #
227 \& # Package = MayaChemTools 7.4
228 \& # Release Date = Oct 21, 2010
229 \& #
230 \& # TimeStamp = Fri Mar 11 14:35:11 2011
231 \& #
232 \& # FingerprintsStringType = FingerprintsVector
233 \& #
234 \& # Description = EStateIndicies:ArbitrarySize
235 \& # VectorStringFormat = IDsAndValuesString
236 \& # VectorValuesType = NumericalValues
237 \& #
238 \& Cmpd1 11;SaaCH SaasC SaasN SdO SdssC...;24.778 4.387 1.993 25.023 \-1...
239 \& Cmpd2 9;SdNH SdO SdssC SsCH3 SsNH...;7.418 22.984 \-1.583 5.387 5.400...
240 \& ... ...
241 \& ... ..
242 .Ve
243 .PP
244 Example of \s-1CSV\s0 \fIText\fR file containing E\-state indicies fingerprints string data:
245 .PP
246 .Vb 10
247 \& "CompoundID","EStateIndiciesFingerprints"
248 \& "Cmpd1","FingerprintsVector;EStateIndicies:ArbitrarySize;11;NumericalVa
249 \& lues;IDsAndValuesString;SaaCH SaasC SaasN SdO SdssC SsCH3 SsF SsOH SssC
250 \& H2 SssNH SsssCH;24.778 4.387 1.993 25.023 \-1.435 3.975 14.006 29.759 \-0
251 \& .073 3.024 \-2.270"
252 \& "Cmpd2","FingerprintsVector;EStateIndicies:ArbitrarySize;9;NumericalVal
253 \& ues;IDsAndValuesString;SdNH SdO SdssC SsCH3 SsNH2 SsOH SssCH2 SssNH Sss
254 \& sCH;7.418 22.984 \-1.583 5.387 5.400 19.852 1.737 5.624 \-3.319"
255 \& ... ...
256 \& ... ...
257 .Ve
258 .PP
259 The current release of MayaChemTools generates the following types of E\-state
260 fingerprints vector strings:
261 .PP
262 .Vb 4
263 \& FingerprintsVector;EStateIndicies:ArbitrarySize;11;NumericalValues;IDs
264 \& AndValuesString;SaaCH SaasC SaasN SdO SdssC SsCH3 SsF SsOH SssCH2 SssN
265 \& H SsssCH;24.778 4.387 1.993 25.023 \-1.435 3.975 14.006 29.759 \-0.073 3
266 \& .024 \-2.270
267 \&
268 \& FingerprintsVector;EStateIndicies:FixedSize;87;OrderedNumericalValues;
269 \& ValuesString;0 0 0 0 0 0 0 3.975 0 \-0.073 0 0 24.778 \-2.270 0 0 \-1.435
270 \& 4.387 0 0 0 0 0 0 3.024 0 0 0 0 0 0 0 1.993 0 29.759 25.023 0 0 0 0 1
271 \& 4.006 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0
272 \& 0 0 0 0 0 0 0 0 0 0 0 0 0 0
273 \&
274 \& FingerprintsVector;EStateIndicies:FixedSize;87;OrderedNumericalValues;
275 \& IDsAndValuesString;SsLi SssBe SssssBem SsBH2 SssBH SsssB SssssBm SsCH3
276 \& SdCH2 SssCH2 StCH SdsCH SaaCH SsssCH SddC StsC SdssC SaasC SaaaC Sssss
277 \& C SsNH3p SsNH2 SssNH2p SdNH SssNH SaaNH StN SsssNHp SdsN SaaN SsssN Sd
278 \& 0 0 0 0 0 0 0 3.975 0 \-0.073 0 0 24.778 \-2.270 0 0 \-1.435 4.387 0 0 0
279 \& 0 0 0 3.024 0 0 0 0 0 0 0 1.993 0 29.759 25.023 0 0 0 0 14.006 0 0 0 0
280 \& 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0...
281 .Ve
282 .SH "OPTIONS"
283 .IX Header "OPTIONS"
284 .IP "\fB\-\-AromaticityModel\fR \fIMDLAromaticityModel | TriposAromaticityModel | MMFFAromaticityModel | ChemAxonBasicAromaticityModel | ChemAxonGeneralAromaticityModel | DaylightAromaticityModel | MayaChemToolsAromaticityModel\fR" 4
285 .IX Item "--AromaticityModel MDLAromaticityModel | TriposAromaticityModel | MMFFAromaticityModel | ChemAxonBasicAromaticityModel | ChemAxonGeneralAromaticityModel | DaylightAromaticityModel | MayaChemToolsAromaticityModel"
286 Specify aromaticity model to use during detection of aromaticity. Possible values in the current
287 release are: \fIMDLAromaticityModel, TriposAromaticityModel, MMFFAromaticityModel,
288 ChemAxonBasicAromaticityModel, ChemAxonGeneralAromaticityModel, DaylightAromaticityModel
289 or MayaChemToolsAromaticityModel\fR. Default value: \fIMayaChemToolsAromaticityModel\fR.
290 .Sp
291 The supported aromaticity model names along with model specific control parameters
292 are defined in \fBAromaticityModelsData.csv\fR, which is distributed with the current release
293 and is available under \fBlib/data\fR directory. \fBMolecule.pm\fR module retrieves data from
294 this file during class instantiation and makes it available to method \fBDetectAromaticity\fR
295 for detecting aromaticity corresponding to a specific model.
296 .IP "\fB\-\-CompoundID\fR \fIDataFieldName or LabelPrefixString\fR" 4
297 .IX Item "--CompoundID DataFieldName or LabelPrefixString"
298 This value is \fB\-\-CompoundIDMode\fR specific and indicates how compound \s-1ID\s0 is generated.
299 .Sp
300 For \fIDataField\fR value of \fB\-\-CompoundIDMode\fR option, it corresponds to datafield label name
301 whose value is used as compound \s-1ID\s0; otherwise, it's a prefix string used for generating compound
302 IDs like LabelPrefixString<Number>. Default value, \fICmpd\fR, generates compound IDs which
303 look like Cmpd<Number>.
304 .Sp
305 Examples for \fIDataField\fR value of \fB\-\-CompoundIDMode\fR:
306 .Sp
307 .Vb 2
308 \& MolID
309 \& ExtReg
310 .Ve
311 .Sp
312 Examples for \fILabelPrefix\fR or \fIMolNameOrLabelPrefix\fR value of \fB\-\-CompoundIDMode\fR:
313 .Sp
314 .Vb 1
315 \& Compound
316 .Ve
317 .Sp
318 The value specified above generates compound IDs which correspond to Compound<Number>
319 instead of default value of Cmpd<Number>.
320 .IP "\fB\-\-CompoundIDLabel\fR \fItext\fR" 4
321 .IX Item "--CompoundIDLabel text"
322 Specify compound \s-1ID\s0 column label for \s-1FP\s0 or \s-1CSV/TSV\s0 text file(s) used during \fICompoundID\fR value
323 of \fB\-\-DataFieldsMode\fR option. Default: \fICompoundID\fR.
324 .IP "\fB\-\-CompoundIDMode\fR \fIDataField | MolName | LabelPrefix | MolNameOrLabelPrefix\fR" 4
325 .IX Item "--CompoundIDMode DataField | MolName | LabelPrefix | MolNameOrLabelPrefix"
326 Specify how to generate compound IDs and write to \s-1FP\s0 or \s-1CSV/TSV\s0 text file(s) along with generated
327 fingerprints for \fI\s-1FP\s0 | text | all\fR values of \fB\-\-output\fR option: use a \fISDFile(s)\fR datafield value;
328 use molname line from \fISDFile(s)\fR; generate a sequential \s-1ID\s0 with specific prefix; use combination
329 of both MolName and LabelPrefix with usage of LabelPrefix values for empty molname lines.
330 .Sp
331 Possible values: \fIDataField | MolName | LabelPrefix | MolNameOrLabelPrefix\fR.
332 Default: \fILabelPrefix\fR.
333 .Sp
334 For \fIMolNameOrLabelPrefix\fR value of \fB\-\-CompoundIDMode\fR, molname line in \fISDFile(s)\fR takes
335 precedence over sequential compound IDs generated using \fILabelPrefix\fR and only empty molname
336 values are replaced with sequential compound IDs.
337 .Sp
338 This is only used for \fICompoundID\fR value of \fB\-\-DataFieldsMode\fR option.
339 .ie n .IP "\fB\-\-DataFields\fR \fI""FieldLabel1,FieldLabel2,...""\fR" 4
340 .el .IP "\fB\-\-DataFields\fR \fI``FieldLabel1,FieldLabel2,...''\fR" 4
341 .IX Item "--DataFields FieldLabel1,FieldLabel2,..."
342 Comma delimited list of \fISDFile(s)\fR data fields to extract and write to \s-1CSV/TSV\s0 text file(s) along
343 with generated fingerprints for \fItext | all\fR values of \fB\-\-output\fR option.
344 .Sp
345 This is only used for \fISpecify\fR value of \fB\-\-DataFieldsMode\fR option.
346 .Sp
347 Examples:
348 .Sp
349 .Vb 2
350 \& Extreg
351 \& MolID,CompoundName
352 .Ve
353 .IP "\fB\-d, \-\-DataFieldsMode\fR \fIAll | Common | Specify | CompoundID\fR" 4
354 .IX Item "-d, --DataFieldsMode All | Common | Specify | CompoundID"
355 Specify how data fields in \fISDFile(s)\fR are transferred to output \s-1CSV/TSV\s0 text file(s) along
356 with generated fingerprints for \fItext | all\fR values of \fB\-\-output\fR option: transfer all \s-1SD\s0
357 data fields; transfer \s-1SD\s0 data fields common to all compounds; extract specified data fields;
358 generate a compound \s-1ID\s0 using molname line, a compound prefix, or a combination of both.
359 Possible values: \fIAll | Common | Specify | CompoundID\fR. Default value: \fICompoundID\fR.
360 .IP "\fB\-e, \-\-EStateAtomTypesSetToUse\fR \fIArbitrarySize | FixedSize\fR" 4
361 .IX Item "-e, --EStateAtomTypesSetToUse ArbitrarySize | FixedSize"
362 E\-state atom types set size to use during generation of E\-state indicies fingerprints.
363 Possible values: \fIArbitrarySize | FixedSize\fR; Default value: \fIArbitrarySize\fR.
364 .Sp
365 \&\fIArbitrarySize\fR corresponds to only E\-state atom types detected in molecule; \fIFixedSize\fR
366 corresponds to fixed number of previously defined E\-state atom types.
367 .Sp
368 For \fIEStateIndicies\fR, a fingerprint vector string is generated. The vector string corresponding to
369 \&\fIEStateIndicies\fR contains sum of E\-state values for E\-state atom types.
370 .Sp
371 Module \fBAtomTypes::EStateAtomTypes.pm\fR is used to assign E\-state atom types to
372 non-hydrogen atoms in the molecule which is able to assign atom types to any valid
373 atom group. However, for \fIFixedSize\fR value of \fBEStateAtomTypesSetToUse\fR,
374 only a fixed set of E\-state atom types corresponding to specific atom groups [ Appendix
375 \&\s-1III\s0 in Ref 77 ] are used for fingerprints.
376 .Sp
377 The fixed size E\-state atom type set size used during generation of fingerprints contains
378 87 E\-state non-hydrogen atom types in EStateAtomTypes.csv data file distributed with
379 MayaChemTools.
380 .IP "\fB\-f, \-\-Filter\fR \fIYes | No\fR" 4
381 .IX Item "-f, --Filter Yes | No"
382 Specify whether to check and filter compound data in SDFile(s). Possible values: \fIYes or No\fR.
383 Default value: \fIYes\fR.
384 .Sp
385 By default, compound data is checked before calculating fingerprints and compounds containing
386 atom data corresponding to non-element symbols or no atom data are ignored.
387 .IP "\fB\-\-FingerprintsLabelMode\fR \fIFingerprintsLabelOnly | FingerprintsLabelWithIDs\fR" 4
388 .IX Item "--FingerprintsLabelMode FingerprintsLabelOnly | FingerprintsLabelWithIDs"
389 Specify how fingerprints label is generated in conjunction with \fB\-\-FingerprintsLabel\fR option value:
390 use fingerprints label generated only by \fB\-\-FingerprintsLabel\fR option value or append E\-state
391 atom type value IDs to \fB\-\-FingerprintsLabel\fR option value.
392 .Sp
393 Possible values: \fIFingerprintsLabelOnly | FingerprintsLabelWithIDs\fR. Default value:
394 \&\fIFingerprintsLabelOnly\fR.
395 .Sp
396 This option is only used for \fIFixedSize\fR value of \fB\-e, \-\-EStateAtomTypesSetToUse\fR option during
397 generation of \fIEStateIndicies\fR E\-state fingerprints.
398 .Sp
399 E\-state atom type IDs appended to \fB\-\-FingerprintsLabel\fR value during \fIFingerprintsLabelWithIDs\fR
400 values of \fB\-\-FingerprintsLabelMode\fR correspond to fixed number of previously defined E\-state
401 atom types.
402 .IP "\fB\-\-FingerprintsLabel\fR \fItext\fR" 4
403 .IX Item "--FingerprintsLabel text"
404 \&\s-1SD\s0 data label or text file column label to use for fingerprints string in output \s-1SD\s0 or
405 \&\s-1CSV/TSV\s0 text file(s) specified by \fB\-\-output\fR. Default value: \fIEStateIndiciesFingerprints\fR.
406 .IP "\fB\-h, \-\-help\fR" 4
407 .IX Item "-h, --help"
408 Print this help message.
409 .IP "\fB\-k, \-\-KeepLargestComponent\fR \fIYes | No\fR" 4
410 .IX Item "-k, --KeepLargestComponent Yes | No"
411 Generate fingerprints for only the largest component in molecule. Possible values:
412 \&\fIYes or No\fR. Default value: \fIYes\fR.
413 .Sp
414 For molecules containing multiple connected components, fingerprints can be generated
415 in two different ways: use all connected components or just the largest connected
416 component. By default, all atoms except for the largest connected component are
417 deleted before generation of fingerprints.
418 .IP "\fB\-\-OutDelim\fR \fIcomma | tab | semicolon\fR" 4
419 .IX Item "--OutDelim comma | tab | semicolon"
420 Delimiter for output \s-1CSV/TSV\s0 text file(s). Possible values: \fIcomma, tab, or semicolon\fR.
421 Default value: \fIcomma\fR.
422 .IP "\fB\-\-output\fR \fI\s-1SD\s0 | \s-1FP\s0 | text | all\fR" 4
423 .IX Item "--output SD | FP | text | all"
424 Type of output files to generate. Possible values: \fI\s-1SD\s0, \s-1FP\s0, text, or all\fR. Default value: \fItext\fR.
425 .IP "\fB\-o, \-\-overwrite\fR" 4
426 .IX Item "-o, --overwrite"
427 Overwrite existing files.
428 .IP "\fB\-q, \-\-quote\fR \fIYes | No\fR" 4
429 .IX Item "-q, --quote Yes | No"
430 Put quotes around column values in output \s-1CSV/TSV\s0 text file(s). Possible values:
431 \&\fIYes or No\fR. Default value: \fIYes\fR.
432 .IP "\fB\-r, \-\-root\fR \fIRootName\fR" 4
433 .IX Item "-r, --root RootName"
434 New file name is generated using the root: <Root>.<Ext>. Default for new file
435 names: <SDFileName><EStateIndiciesFP>.<Ext>. The file type determines <Ext> value.
436 The sdf, fpf, csv, and tsv <Ext> values are used for \s-1SD\s0, \s-1FP\s0, comma/semicolon, and tab
437 delimited text files, respectively. This option is ignored for multiple input files.
438 .IP "\fB\-\-ValuesPrecision\fR \fInumber\fR" 4
439 .IX Item "--ValuesPrecision number"
440 Precision of values for E\-state indicies option. Default value: up to \fI3\fR decimal places.
441 Valid values: positive integers.
442 .IP "\fB\-v, \-\-VectorStringFormat\fR \fIValuesString | IDsAndValuesString | IDsAndValuesPairsString | ValuesAndIDsString | ValuesAndIDsPairsString\fR" 4
443 .IX Item "-v, --VectorStringFormat ValuesString | IDsAndValuesString | IDsAndValuesPairsString | ValuesAndIDsString | ValuesAndIDsPairsString"
444 Format of fingerprints vector string data in output \s-1SD\s0, \s-1FP\s0 or \s-1CSV/TSV\s0 text file(s) specified by
445 \&\fB\-\-output\fR used for \fIEStateIndicies\fR. Possible values: \fIValuesString, IDsAndValuesString,
446 IDsAndValuesPairsString, ValuesAndIDsString, ValuesAndIDsPairsString\fR.
447 .Sp
448 Default value during \fIArbitrarySize\fR value of \fB\-e, \-\-EStateAtomTypesSetToUse\fR
449 option: \fIIDsAndValuesString\fR. Default value during \fIFixedSize\fR value of
450 \&\fB\-e, \-\-EStateAtomTypesSetToUse\fR option: \fIValuesString\fR.
451 .Sp
452 Examples:
453 .Sp
454 .Vb 4
455 \& FingerprintsVector;EStateIndicies:ArbitrarySize;11;NumericalValues;IDs
456 \& AndValuesString;SaaCH SaasC SaasN SdO SdssC SsCH3 SsF SsOH SssCH2 SssN
457 \& H SsssCH;24.778 4.387 1.993 25.023 \-1.435 3.975 14.006 29.759 \-0.073 3
458 \& .024 \-2.270
459 .Ve
460 .IP "\fB\-w, \-\-WorkingDir\fR \fIDirName\fR" 4
461 .IX Item "-w, --WorkingDir DirName"
462 Location of working directory. Default: current directory.
463 .SH "EXAMPLES"
464 .IX Header "EXAMPLES"
465 To generate E\-state fingerprints of arbitrary size in vector string format and create a
466 SampleESFP.csv file containing sequential compound IDs along with fingerprints
467 vector strings data, type:
468 .PP
469 .Vb 1
470 \& % EStateIndiciesFingerprints.pl \-r SampleESFP \-o Sample.sdf
471 .Ve
472 .PP
473 To generate E\-state fingerprints of fixed size in vector string format and create a
474 SampleESFP.csv file containing sequential compound IDs along with fingerprints
475 vector strings data, type:
476 .PP
477 .Vb 2
478 \& % EStateIndiciesFingerprints.pl \-e FixedSize \-r SampleESFP
479 \& \-o Sample.sdf
480 .Ve
481 .PP
482 To generate E\-state fingerprints of fixed size in vector string with IDsAndValues
483 format and create a SampleESFP.csv file containing sequential compound IDs
484 along with fingerprints vector strings data, type:
485 .PP
486 .Vb 2
487 \& % EStateIndiciesFingerprints.pl \-e FixedSize \-v IDsAndValuesString
488 \& \-r SampleESFP \-o Sample.sdf
489 .Ve
490 .PP
491 To generate E\-state fingerprints of fixed size in vector string format
492 and create a SampleESFP.csv file containing compound \s-1ID\s0 from molecule
493 name line along with fingerprints vector strings data, type:
494 .PP
495 .Vb 3
496 \& % EStateIndiciesFingerprints.pl \-e FixedSize
497 \& \-\-DataFieldsMode CompoundID \-\-CompoundIDMode MolName
498 \& \-r SampleESFP \-o Sample.sdf
499 .Ve
500 .PP
501 To generate E\-state fingerprints of fixed size in vector string format
502 and create a SampleESFP.csv file containing compound IDs using specified
503 data field along with fingerprints vector strings data, type:
504 .PP
505 .Vb 3
506 \& % EStateIndiciesFingerprints.pl \-e FixedSize
507 \& \-\-DataFieldsMode CompoundID \-\-CompoundIDMode DataField \-\-CompoundID
508 \& Mol_ID \-r SampleESFP \-o Sample.sdf
509 .Ve
510 .PP
511 To generate E\-state fingerprints of fixed size in vector string format
512 and create a SampleESFP.csv file containing compound \s-1ID\s0 using combination
513 of molecule name line and an explicit compound prefix along with fingerprints vector
514 strings data, type:
515 .PP
516 .Vb 3
517 \& % EStateIndiciesFingerprints.pl \-e FixedSize
518 \& \-\-DataFieldsMode CompoundID \-\-CompoundIDMode MolnameOrLabelPrefix
519 \& \-\-CompoundID Cmpd \-\-CompoundIDLabel MolID \-r SampleESFP \-o Sample.sdf
520 .Ve
521 .PP
522 To generate E\-state fingerprints of fixed size in vector string format
523 and create a SampleESFP.csv file containing specific data fields columns along
524 with fingerprints vector strings data, type:
525 .PP
526 .Vb 3
527 \& % EStateIndiciesFingerprints.pl \-e FixedSize
528 \& \-\-DataFieldsMode Specify \-\-DataFields Mol_ID \-r SampleESFP
529 \& \-o Sample.sdf
530 .Ve
531 .PP
532 To generate E\-state fingerprints of fixed size in vector string format
533 and create a SampleESFP.csv file containing common data fields columns along
534 with fingerprints vector strings data, type:
535 .PP
536 .Vb 2
537 \& % EStateIndiciesFingerprints.pl \-e FixedSize
538 \& \-\-DataFieldsMode Common \-r SampleESFP \-o Sample.sdf
539 .Ve
540 .PP
541 To generate E\-state fingerprints of fixed size in vector string format and create
542 SampleESFP.sdf, SampleESFP.fpf, and SampleESFP.csv files containing all data
543 fields columns in \s-1CSV\s0 file along with fingerprints vector strings data, type:
544 .PP
545 .Vb 2
546 \& % EStateIndiciesFingerprints.pl \-e FixedSize
547 \& \-\-DataFieldsMode All \-\-output all \-r SampleESFP \-o Sample.sdf
548 .Ve
549 .SH "AUTHOR"
550 .IX Header "AUTHOR"
551 Manish Sud <msud@san.rr.com>
552 .SH "SEE ALSO"
553 .IX Header "SEE ALSO"
554 InfoFingerprintsFiles.pl, SimilarityMatricesFingerprints.pl, AtomNeighborhoodsFingerprints.pl,
555 ExtendedConnectivityFingerprints.pl, MACCSKeysFingerprints.pl, PathLengthFingerprints.pl,
556 TopologicalAtomPairsFingerprints.pl, TopologicalAtomTorsionsFingerprints.pl,
557 TopologicalPharmacophoreAtomPairsFingerprints.pl, TopologicalPharmacophoreAtomTripletsFingerprints.pl
558 .SH "COPYRIGHT"
559 .IX Header "COPYRIGHT"
560 Copyright (C) 2015 Manish Sud. All rights reserved.
561 .PP
562 This file is part of MayaChemTools.
563 .PP
564 MayaChemTools is free software; you can redistribute it and/or modify it under
565 the terms of the \s-1GNU\s0 Lesser General Public License as published by the Free
566 Software Foundation; either version 3 of the License, or (at your option)
567 any later version.