comparison docs/scripts/man1/TopologicalAtomTripletsFingerprints.1 @ 0:4816e4a8ae95 draft default tip

Uploaded
author deepakjadmin
date Wed, 20 Jan 2016 09:23:18 -0500
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:4816e4a8ae95
1 .\" Automatically generated by Pod::Man 2.25 (Pod::Simple 3.22)
2 .\"
3 .\" Standard preamble:
4 .\" ========================================================================
5 .de Sp \" Vertical space (when we can't use .PP)
6 .if t .sp .5v
7 .if n .sp
8 ..
9 .de Vb \" Begin verbatim text
10 .ft CW
11 .nf
12 .ne \\$1
13 ..
14 .de Ve \" End verbatim text
15 .ft R
16 .fi
17 ..
18 .\" Set up some character translations and predefined strings. \*(-- will
19 .\" give an unbreakable dash, \*(PI will give pi, \*(L" will give a left
20 .\" double quote, and \*(R" will give a right double quote. \*(C+ will
21 .\" give a nicer C++. Capital omega is used to do unbreakable dashes and
22 .\" therefore won't be available. \*(C` and \*(C' expand to `' in nroff,
23 .\" nothing in troff, for use with C<>.
24 .tr \(*W-
25 .ds C+ C\v'-.1v'\h'-1p'\s-2+\h'-1p'+\s0\v'.1v'\h'-1p'
26 .ie n \{\
27 . ds -- \(*W-
28 . ds PI pi
29 . if (\n(.H=4u)&(1m=24u) .ds -- \(*W\h'-12u'\(*W\h'-12u'-\" diablo 10 pitch
30 . if (\n(.H=4u)&(1m=20u) .ds -- \(*W\h'-12u'\(*W\h'-8u'-\" diablo 12 pitch
31 . ds L" ""
32 . ds R" ""
33 . ds C` ""
34 . ds C' ""
35 'br\}
36 .el\{\
37 . ds -- \|\(em\|
38 . ds PI \(*p
39 . ds L" ``
40 . ds R" ''
41 'br\}
42 .\"
43 .\" Escape single quotes in literal strings from groff's Unicode transform.
44 .ie \n(.g .ds Aq \(aq
45 .el .ds Aq '
46 .\"
47 .\" If the F register is turned on, we'll generate index entries on stderr for
48 .\" titles (.TH), headers (.SH), subsections (.SS), items (.Ip), and index
49 .\" entries marked with X<> in POD. Of course, you'll have to process the
50 .\" output yourself in some meaningful fashion.
51 .ie \nF \{\
52 . de IX
53 . tm Index:\\$1\t\\n%\t"\\$2"
54 ..
55 . nr % 0
56 . rr F
57 .\}
58 .el \{\
59 . de IX
60 ..
61 .\}
62 .\"
63 .\" Accent mark definitions (@(#)ms.acc 1.5 88/02/08 SMI; from UCB 4.2).
64 .\" Fear. Run. Save yourself. No user-serviceable parts.
65 . \" fudge factors for nroff and troff
66 .if n \{\
67 . ds #H 0
68 . ds #V .8m
69 . ds #F .3m
70 . ds #[ \f1
71 . ds #] \fP
72 .\}
73 .if t \{\
74 . ds #H ((1u-(\\\\n(.fu%2u))*.13m)
75 . ds #V .6m
76 . ds #F 0
77 . ds #[ \&
78 . ds #] \&
79 .\}
80 . \" simple accents for nroff and troff
81 .if n \{\
82 . ds ' \&
83 . ds ` \&
84 . ds ^ \&
85 . ds , \&
86 . ds ~ ~
87 . ds /
88 .\}
89 .if t \{\
90 . ds ' \\k:\h'-(\\n(.wu*8/10-\*(#H)'\'\h"|\\n:u"
91 . ds ` \\k:\h'-(\\n(.wu*8/10-\*(#H)'\`\h'|\\n:u'
92 . ds ^ \\k:\h'-(\\n(.wu*10/11-\*(#H)'^\h'|\\n:u'
93 . ds , \\k:\h'-(\\n(.wu*8/10)',\h'|\\n:u'
94 . ds ~ \\k:\h'-(\\n(.wu-\*(#H-.1m)'~\h'|\\n:u'
95 . ds / \\k:\h'-(\\n(.wu*8/10-\*(#H)'\z\(sl\h'|\\n:u'
96 .\}
97 . \" troff and (daisy-wheel) nroff accents
98 .ds : \\k:\h'-(\\n(.wu*8/10-\*(#H+.1m+\*(#F)'\v'-\*(#V'\z.\h'.2m+\*(#F'.\h'|\\n:u'\v'\*(#V'
99 .ds 8 \h'\*(#H'\(*b\h'-\*(#H'
100 .ds o \\k:\h'-(\\n(.wu+\w'\(de'u-\*(#H)/2u'\v'-.3n'\*(#[\z\(de\v'.3n'\h'|\\n:u'\*(#]
101 .ds d- \h'\*(#H'\(pd\h'-\w'~'u'\v'-.25m'\f2\(hy\fP\v'.25m'\h'-\*(#H'
102 .ds D- D\\k:\h'-\w'D'u'\v'-.11m'\z\(hy\v'.11m'\h'|\\n:u'
103 .ds th \*(#[\v'.3m'\s+1I\s-1\v'-.3m'\h'-(\w'I'u*2/3)'\s-1o\s+1\*(#]
104 .ds Th \*(#[\s+2I\s-2\h'-\w'I'u*3/5'\v'-.3m'o\v'.3m'\*(#]
105 .ds ae a\h'-(\w'a'u*4/10)'e
106 .ds Ae A\h'-(\w'A'u*4/10)'E
107 . \" corrections for vroff
108 .if v .ds ~ \\k:\h'-(\\n(.wu*9/10-\*(#H)'\s-2\u~\d\s+2\h'|\\n:u'
109 .if v .ds ^ \\k:\h'-(\\n(.wu*10/11-\*(#H)'\v'-.4m'^\v'.4m'\h'|\\n:u'
110 . \" for low resolution devices (crt and lpr)
111 .if \n(.H>23 .if \n(.V>19 \
112 \{\
113 . ds : e
114 . ds 8 ss
115 . ds o a
116 . ds d- d\h'-1'\(ga
117 . ds D- D\h'-1'\(hy
118 . ds th \o'bp'
119 . ds Th \o'LP'
120 . ds ae ae
121 . ds Ae AE
122 .\}
123 .rm #[ #] #H #V #F C
124 .\" ========================================================================
125 .\"
126 .IX Title "TOPOLOGICALATOMTRIPLETSFINGERPRINTS 1"
127 .TH TOPOLOGICALATOMTRIPLETSFINGERPRINTS 1 "2015-03-29" "perl v5.14.2" "MayaChemTools"
128 .\" For nroff, turn off justification. Always turn off hyphenation; it makes
129 .\" way too many mistakes in technical documents.
130 .if n .ad l
131 .nh
132 .SH "NAME"
133 TopologicalAtomTripletsFingerprints.pl \- Generate topological atom triplets fingerprints for SD files
134 .SH "SYNOPSIS"
135 .IX Header "SYNOPSIS"
136 TopologicalAtomTripletsFingerprints.pl SDFile(s)...
137 .PP
138 TopologicalAtomTripletsFingerprints.pl [\fB\-\-AromaticityModel\fR \fIAromaticityModelType\fR]
139 [\fB\-a, \-\-AtomIdentifierType\fR \fIAtomicInvariantsAtomTypes\fR]
140 [\fB\-\-AtomicInvariantsToUse\fR \fI\*(L"AtomicInvariant,AtomicInvariant...\*(R"\fR]
141 [\fB\-\-FunctionalClassesToUse\fR \fI\*(L"FunctionalClass1,FunctionalClass2...\*(R"\fR]
142 [\fB\-\-CompoundID\fR \fIDataFieldName or LabelPrefixString\fR] [\fB\-\-CompoundIDLabel\fR \fItext\fR]
143 [\fB\-\-CompoundIDMode\fR] [\fB\-\-DataFields\fR \fI\*(L"FieldLabel1,FieldLabel2,...\*(R"\fR]
144 [\fB\-d, \-\-DataFieldsMode\fR \fIAll | Common | Specify | CompoundID\fR] [\fB\-f, \-\-Filter\fR \fIYes | No\fR]
145 [\fB\-\-FingerprintsLabel\fR \fItext\fR] [\fB\-h, \-\-help\fR] [\fB\-k, \-\-KeepLargestComponent\fR \fIYes | No\fR]
146 [\fB\-\-MinDistance\fR \fInumber\fR] [\fB\-\-MaxDistance\fR \fInumber\fR]
147 [\fB\-\-OutDelim\fR \fIcomma | tab | semicolon\fR] [\fB\-\-output\fR \fI\s-1SD\s0 | \s-1FP\s0 | text | all\fR] [\fB\-o, \-\-overwrite\fR]
148 [\fB\-q, \-\-quote\fR \fIYes | No\fR] [\fB\-r, \-\-root\fR \fIRootName\fR] [\fB\-u, \-\-UseTriangleInequality\fR \fIYes | No\fR]
149 [\fB\-v, \-\-VectorStringFormat\fR \fIValuesString, IDsAndValuesString | IDsAndValuesPairsString | ValuesAndIDsString | ValuesAndIDsPairsString\fR]
150 [\fB\-w, \-\-WorkingDir\fR dirname] SDFile(s)...
151 .SH "DESCRIPTION"
152 .IX Header "DESCRIPTION"
153 Generate topological atom triplets fingerprints for \fISDFile(s)\fR and create
154 appropriate \s-1SD\s0, \s-1FP\s0 or \s-1CSV/TSV\s0 text file(s) containing fingerprints vector strings corresponding to
155 molecular fingerprints.
156 .PP
157 Multiple SDFile names are separated by spaces. The valid file extensions are \fI.sdf\fR
158 and \fI.sd\fR. All other file names are ignored. All the \s-1SD\s0 files in a current directory
159 can be specified either by \fI*.sdf\fR or the current directory name.
160 .PP
161 The current release of MayaChemTools supports generation of topological atom triplets
162 fingerprints corresponding to following \fB\-a, \-\-AtomIdentifierTypes\fR:
163 .PP
164 .Vb 3
165 \& AtomicInvariantsAtomTypes, DREIDINGAtomTypes, EStateAtomTypes,
166 \& FunctionalClassAtomTypes, MMFF94AtomTypes, SLogPAtomTypes,
167 \& SYBYLAtomTypes, TPSAAtomTypes, UFFAtomTypes
168 .Ve
169 .PP
170 Based on the values specified for \fB\-a, \-\-AtomIdentifierType\fR and \fB\-\-AtomicInvariantsToUse\fR,
171 initial atom types are assigned to all non-hydrogen atoms in a molecule. Using the distance
172 matrix for the molecule and initial atom types assigned to non-hydrogen atoms, all unique atom
173 pairs within \fB\-\-MinDistance\fR and \fB\-\-MaxDistance\fR are identified and counted. An atom triplet
174 identifier is generated for each unique atom triplet; the format of the atom triplet identifier is:
175 .PP
176 .Vb 1
177 \& <ATx>\-Dyz\-<ATy>\-Dxz\-<ATz>\-Dxy
178 \&
179 \& ATx, ATy, ATz: Atom types assigned to atom x, atom y, and atom z
180 \& Dxy: Distance between atom x and atom y
181 \& Dxz: Distance between atom x and atom z
182 \& Dyz: Distance between atom y and atom z
183 \&
184 \& where <AT1>\-D23 <= <AT2>\-D13 <= <AT3>\-D12
185 .Ve
186 .PP
187 The atom triplet identifiers for all unique atom triplets corresponding to non-hydrogen atoms constitute
188 topological atom triplets fingerprints of the molecule.
189 .PP
190 Example of \fI\s-1SD\s0\fR file containing topological atom triplets fingerprints string data:
191 .PP
192 .Vb 10
193 \& ... ...
194 \& ... ...
195 \& $$$$
196 \& ... ...
197 \& ... ...
198 \& ... ...
199 \& 41 44 0 0 0 0 0 0 0 0999 V2000
200 \& \-3.3652 1.4499 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
201 \& ... ...
202 \& 2 3 1 0 0 0 0
203 \& ... ...
204 \& M END
205 \& > <CmpdID>
206 \& Cmpd1
207 \&
208 \& > <TopologicalAtomTripletsFingerprints>
209 \& FingerprintsVector;TopologicalAtomTriplets:AtomicInvariantsAtomTypes:Mi
210 \& nDistance1:MaxDistance10;3096;NumericalValues;IDsAndValuesString;C.X1.B
211 \& O1.H3\-D1\-C.X1.BO1.H3\-D1\-C.X3.BO3.H1\-D2 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D10\-C
212 \& .X3.BO4\-D9 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D3\-N.X3.BO3\-D4 C.X1.BO1.H3\-D1...;
213 \& 1 2 2 2 2 2 2 2 8 8 4 8 4 4 2 2 2 2 4 2 2 2 4 2 2 2 2 1 2 2 4 4 4 2 2 2
214 \& 4 4 4 8 4 4 2 4 4 4 2 4 4 2 2 2 2 2 2 2 2 1 2 2 2 2 2 2 2 2 2 2 8 8 ...
215 \&
216 \& $$$$
217 \& ... ...
218 \& ... ...
219 .Ve
220 .PP
221 Example of \fI\s-1FP\s0\fR file containing topological atom triplets fingerprints string data:
222 .PP
223 .Vb 10
224 \& #
225 \& # Package = MayaChemTools 7.4
226 \& # Release Date = Oct 21, 2010
227 \& #
228 \& # TimeStamp = Fri Mar 11 15:24:01 2011
229 \& #
230 \& # FingerprintsStringType = FingerprintsVector
231 \& #
232 \& # Description = TopologicalAtomTriplets:AtomicInvariantsAtomTypes:Mi...
233 \& # VectorStringFormat = IDsAndValuesString
234 \& # VectorValuesType = NumericalValues
235 \& #
236 \& Cmpd1 3096;C.X1.BO1.H3\-D1\-C.X1.BO1.H3\-D1\-C.X3.BO3.H1\-D2...;1 2 2 2 2...
237 \& Cmpd2 1093;C.X1.BO1.H3\-D1\-C.X1.BO1.H3\-D3\-C.X2.BO2.H2\-D4...;2 2 2 2 2...
238 \& ... ...
239 \& ... ..
240 .Ve
241 .PP
242 Example of \s-1CSV\s0 \fIText\fR file containing topological atom triplets fingerprints string data:
243 .PP
244 .Vb 9
245 \& "CompoundID","TopologicalAtomTripletsFingerprints"
246 \& "Cmpd1","FingerprintsVector;TopologicalAtomTriplets:AtomicInvariantsAto
247 \& mTypes:MinDistance1:MaxDistance10;3096;NumericalValues;IDsAndValuesStri
248 \& ng;C.X1.BO1.H3\-D1\-C.X1.BO1.H3\-D1\-C.X3.BO3.H1\-D2 C.X1.BO1.H3\-D1\-C.X2.BO2
249 \& .H2\-D10\-C.X3.BO4\-D9 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D3\-N.X3.BO3\-D4 C.X1....;
250 \& 1 2 2 2 2 2 2 2 8 8 4 8 4 4 2 2 2 2 4 2 2 2 4 2 2 2 2 1 2 2 4 4 4 2 2 2
251 \& 4 4 4 8 4 4 2 4 4 4 2 4 4 2 2 2 2 2 2 2 2 1 2 2 2 2 2 2 2 2 2 2 8 8 ...
252 \& ... ...
253 \& ... ...
254 .Ve
255 .PP
256 The current release of MayaChemTools generates the following types of topological atom triplets
257 fingerprints vector strings:
258 .PP
259 .Vb 7
260 \& FingerprintsVector;TopologicalAtomTriplets:AtomicInvariantsAtomTypes:M
261 \& inDistance1:MaxDistance10;3096;NumericalValues;IDsAndValuesString;C.X1
262 \& .BO1.H3\-D1\-C.X1.BO1.H3\-D1\-C.X3.BO3.H1\-D2 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D1
263 \& 0\-C.X3.BO4\-D9 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D3\-N.X3.BO3\-D4 C.X1.BO1.H3\-D1
264 \& \-C.X2.BO2.H2\-D4\-C.X2.BO2.H2\-D5 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D6\-C.X3....;
265 \& 1 2 2 2 2 2 2 2 8 8 4 8 4 4 2 2 2 2 4 2 2 2 4 2 2 2 2 1 2 2 4 4 4 2 2
266 \& 2 4 4 4 8 4 4 2 4 4 4 2 4 4 2 2 2 2 2 2 2 2 1 2 2 2 2 2 2 2 2 2 2 8...
267 \&
268 \& FingerprintsVector;TopologicalAtomTriplets:AtomicInvariantsAtomTypes:M
269 \& inDistance1:MaxDistance10;3096;NumericalValues;IDsAndValuesPairsString
270 \& ;C.X1.BO1.H3\-D1\-C.X1.BO1.H3\-D1\-C.X3.BO3.H1\-D2 1 C.X1.BO1.H3\-D1\-C.X2.BO
271 \& 2.H2\-D10\-C.X3.BO4\-D9 2 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D3\-N.X3.BO3\-D4 2 C.X
272 \& 1.BO1.H3\-D1\-C.X2.BO2.H2\-D4\-C.X2.BO2.H2\-D5 2 C.X1.BO1.H3\-D1\-C.X2.BO2.H2
273 \& \-D6\-C.X3.BO3.H1\-D5 2 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D6\-C.X3.BO3.H1\-D7 2...
274 \&
275 \& FingerprintsVector;TopologicalAtomTriplets:DREIDINGAtomTypes:MinDistan
276 \& ce1:MaxDistance10;2377;NumericalValues;IDsAndValuesString;C_2\-D1\-C_2\-D
277 \& 9\-C_3\-D10 C_2\-D1\-C_2\-D9\-C_R\-D10 C_2\-D1\-C_3\-D1\-C_3\-D2 C_2\-D1\-C_3\-D10\-C_
278 \& 3\-D9 C_2\-D1\-C_3\-D2\-C_3\-D3 C_2\-D1\-C_3\-D2\-C_R\-D3 C_2\-D1\-C_3\-D3\-C_3\-D4 C_
279 \& 2\-D1\-C_3\-D3\-N_R\-D4 C_2\-D1\-C_3\-D3\-O_3\-D2 C_2\-D1\-C_3\-D4\-C_3\-D5 C_2\-D...;
280 \& 1 1 1 2 1 1 3 1 1 2 2 1 1 1 1 1 1 1 1 2 1 3 4 5 1 1 6 4 2 2 3 1 1 1 2
281 \& 2 1 2 1 1 2 2 2 1 2 1 2 1 1 3 3 2 6 4 2 1 1 1 2 2 1 1 1 1 1 1 1 1 1...
282 \&
283 \& FingerprintsVector;TopologicalAtomTriplets:EStateAtomTypes:MinDistance
284 \& 1:MaxDistance10;3298;NumericalValues;IDsAndValuesString;aaCH\-D1\-aaCH\-D
285 \& 1\-aaCH\-D2 aaCH\-D1\-aaCH\-D1\-aasC\-D2 aaCH\-D1\-aaCH\-D10\-aaCH\-D9 aaCH\-D1\-aaC
286 \& H\-D10\-aasC\-D9 aaCH\-D1\-aaCH\-D2\-aaCH\-D3 aaCH\-D1\-aaCH\-D2\-aasC\-D1 aaCH\-D1\-
287 \& aaCH\-D2\-aasC\-D3 aaCH\-D1\-aaCH\-D3\-aasC\-D2 aaCH\-D1\-aaCH\-D4\-aasC\-D5 aa...;
288 \& 6 4 24 4 16 8 8 4 8 8 8 12 10 14 4 16 24 4 12 2 2 4 1 10 2 2 15 2 2 2
289 \& 2 2 2 14 4 2 2 2 2 1 2 10 2 2 4 1 2 4 8 3 3 3 4 6 4 2 2 3 3 1 1 1 2 1
290 \& 2 2 4 2 3 2 1 2 4 5 3 2 2 1 2 4 3 2 8 12 6 2 2 4 4 7 1 4 2 4 2 2 2 ...
291 \&
292 \& FingerprintsVector;TopologicalAtomTriplets:FunctionalClassAtomTypes:Mi
293 \& nDistance1:MaxDistance10;2182;NumericalValues;IDsAndValuesString;Ar\-D1
294 \& \-Ar\-D1\-Ar\-D2 Ar\-D1\-Ar\-D1\-Ar.HBA\-D2 Ar\-D1\-Ar\-D10\-Ar\-D9 Ar\-D1\-Ar\-D10\-Hal
295 \& \-D9 Ar\-D1\-Ar\-D2\-Ar\-D2 Ar\-D1\-Ar\-D2\-Ar\-D3 Ar\-D1\-Ar\-D2\-Ar.HBA\-D1 Ar\-D1\-Ar
296 \& \-D2\-Ar.HBA\-D2 Ar\-D1\-Ar\-D2\-Ar.HBA\-D3 Ar\-D1\-Ar\-D2\-HBD\-D1 Ar\-D1\-Ar\-D2...;
297 \& 27 1 32 2 2 63 3 2 1 2 1 2 3 1 1 40 3 1 2 2 2 2 4 2 2 47 4 2 2 1 2 1 5
298 \& 2 2 51 4 3 1 3 1 9 1 1 50 3 3 4 1 9 50 2 2 3 3 5 45 1 1 1 2 1 2 2 3 3
299 \& 4 4 3 2 1 1 3 4 5 5 3 1 2 3 2 3 5 7 2 7 3 7 1 1 2 2 2 2 3 1 4 3 1 2...
300 \&
301 \& FingerprintsVector;TopologicalAtomTriplets:MMFF94AtomTypes:MinDistance
302 \& 1:MaxDistance10;2966;NumericalValues;IDsAndValuesString;C5A\-D1\-C5A\-D1\-
303 \& N5\-D2 C5A\-D1\-C5A\-D2\-C5B\-D2 C5A\-D1\-C5A\-D3\-CB\-D2 C5A\-D1\-C5A\-D3\-CR\-D2 C5A
304 \& \-D1\-C5B\-D1\-C5B\-D2 C5A\-D1\-C5B\-D2\-C=ON\-D1 C5A\-D1\-C5B\-D2\-CB\-D1 C5A\-D1\-C5B
305 \& \-D3\-C=ON\-D2 C5A\-D1\-C5B\-D3\-CB\-D2 C5A\-D1\-C=ON\-D3\-NC=O\-D2 C5A\-D1\-C=ON\-D3\-
306 \& O=CN\-D2 C5A\-D1\-C=ON\-D4\-NC=O\-D3 C5A\-D1\-C=ON\-D4\-O=CN\-D3 C5A\-D1\-CB\-D1\-...
307 \&
308 \& FingerprintsVector;TopologicalAtomTriplets:SLogPAtomTypes:MinDistance1
309 \& :MaxDistance10;3710;NumericalValues;IDsAndValuesString;C1\-D1\-C1\-D1\-C11
310 \& \-D2 C1\-D1\-C1\-D1\-CS\-D2 C1\-D1\-C1\-D10\-C5\-D9 C1\-D1\-C1\-D3\-C10\-D2 C1\-D1\-C1\-D
311 \& 3\-C5\-D2 C1\-D1\-C1\-D3\-CS\-D2 C1\-D1\-C1\-D3\-CS\-D4 C1\-D1\-C1\-D4\-C10\-D5 C1\-D1\-C
312 \& 1\-D4\-C11\-D5 C1\-D1\-C1\-D5\-C10\-D4 C1\-D1\-C1\-D5\-C5\-D4 C1\-D1\-C1\-D6\-C11\-D7 C1
313 \& \-D1\-C1\-D6\-CS\-D5 C1\-D1\-C1\-D6\-CS\-D7 C1\-D1\-C1\-D8\-C11\-D9 C1\-D1\-C1\-D8\-CS...
314 \&
315 \& FingerprintsVector;TopologicalAtomTriplets:SYBYLAtomTypes:MinDistance1
316 \& :MaxDistance10;2332;NumericalValues;IDsAndValuesString;C.2\-D1\-C.2\-D9\-C
317 \& .3\-D10 C.2\-D1\-C.2\-D9\-C.ar\-D10 C.2\-D1\-C.3\-D1\-C.3\-D2 C.2\-D1\-C.3\-D10\-C.3\-
318 \& D9 C.2\-D1\-C.3\-D2\-C.3\-D3 C.2\-D1\-C.3\-D2\-C.ar\-D3 C.2\-D1\-C.3\-D3\-C.3\-D4 C.2
319 \& \-D1\-C.3\-D3\-N.ar\-D4 C.2\-D1\-C.3\-D3\-O.3\-D2 C.2\-D1\-C.3\-D4\-C.3\-D5 C.2\-D1\-C.
320 \& 3\-D5\-C.3\-D6 C.2\-D1\-C.3\-D5\-O.3\-D4 C.2\-D1\-C.3\-D6\-C.3\-D7 C.2\-D1\-C.3\-D7...
321 \&
322 \& FingerprintsVector;TopologicalAtomTriplets:TPSAAtomTypes:MinDistance1:
323 \& MaxDistance10;1007;NumericalValues;IDsAndValuesString;N21\-D1\-N7\-D3\-Non
324 \& e\-D4 N21\-D1\-N7\-D5\-None\-D4 N21\-D1\-None\-D1\-None\-D2 N21\-D1\-None\-D2\-None\-D
325 \& 2 N21\-D1\-None\-D2\-None\-D3 N21\-D1\-None\-D3\-None\-D4 N21\-D1\-None\-D4\-None\-D5
326 \& N21\-D1\-None\-D4\-O3\-D3 N21\-D1\-None\-D4\-O4\-D3 N21\-D1\-None\-D5\-None\-D6 N21\-
327 \& D1\-None\-D6\-None\-D7 N21\-D1\-None\-D6\-O4\-D5 N21\-D1\-None\-D7\-None\-D8 N21\-...
328 \&
329 \& FingerprintsVector;TopologicalAtomTriplets:UFFAtomTypes:MinDistance1:M
330 \& axDistance10;2377;NumericalValues;IDsAndValuesString;C_2\-D1\-C_2\-D9\-C_3
331 \& \-D10 C_2\-D1\-C_2\-D9\-C_R\-D10 C_2\-D1\-C_3\-D1\-C_3\-D2 C_2\-D1\-C_3\-D10\-C_3\-D9
332 \& C_2\-D1\-C_3\-D2\-C_3\-D3 C_2\-D1\-C_3\-D2\-C_R\-D3 C_2\-D1\-C_3\-D3\-C_3\-D4 C_2\-D1\-
333 \& C_3\-D3\-N_R\-D4 C_2\-D1\-C_3\-D3\-O_3\-D2 C_2\-D1\-C_3\-D4\-C_3\-D5 C_2\-D1\-C_3\-D5\-
334 \& C_3\-D6 C_2\-D1\-C_3\-D5\-O_3\-D4 C_2\-D1\-C_3\-D6\-C_3\-D7 C_2\-D1\-C_3\-D7\-C_3\-...
335 .Ve
336 .SH "OPTIONS"
337 .IX Header "OPTIONS"
338 .IP "\fB\-\-AromaticityModel\fR \fIMDLAromaticityModel | TriposAromaticityModel | MMFFAromaticityModel | ChemAxonBasicAromaticityModel | ChemAxonGeneralAromaticityModel | DaylightAromaticityModel | MayaChemToolsAromaticityModel\fR" 4
339 .IX Item "--AromaticityModel MDLAromaticityModel | TriposAromaticityModel | MMFFAromaticityModel | ChemAxonBasicAromaticityModel | ChemAxonGeneralAromaticityModel | DaylightAromaticityModel | MayaChemToolsAromaticityModel"
340 Specify aromaticity model to use during detection of aromaticity. Possible values in the current
341 release are: \fIMDLAromaticityModel, TriposAromaticityModel, MMFFAromaticityModel,
342 ChemAxonBasicAromaticityModel, ChemAxonGeneralAromaticityModel, DaylightAromaticityModel
343 or MayaChemToolsAromaticityModel\fR. Default value: \fIMayaChemToolsAromaticityModel\fR.
344 .Sp
345 The supported aromaticity model names along with model specific control parameters
346 are defined in \fBAromaticityModelsData.csv\fR, which is distributed with the current release
347 and is available under \fBlib/data\fR directory. \fBMolecule.pm\fR module retrieves data from
348 this file during class instantiation and makes it available to method \fBDetectAromaticity\fR
349 for detecting aromaticity corresponding to a specific model.
350 .IP "\fB\-a, \-\-AtomIdentifierType\fR \fIAtomicInvariantsAtomTypes | DREIDINGAtomTypes | EStateAtomTypes | FunctionalClassAtomTypes | MMFF94AtomTypes | SLogPAtomTypes | SYBYLAtomTypes | TPSAAtomTypes | UFFAtomTypes\fR" 4
351 .IX Item "-a, --AtomIdentifierType AtomicInvariantsAtomTypes | DREIDINGAtomTypes | EStateAtomTypes | FunctionalClassAtomTypes | MMFF94AtomTypes | SLogPAtomTypes | SYBYLAtomTypes | TPSAAtomTypes | UFFAtomTypes"
352 Specify atom identifier type to use for assignment of initial atom identifier to non-hydrogen
353 atoms during calculation of topological atom triplets fingerprints. Possible values in the current
354 release are: \fIAtomicInvariantsAtomTypes, DREIDINGAtomTypes, EStateAtomTypes,
355 FunctionalClassAtomTypes, MMFF94AtomTypes, SLogPAtomTypes, SYBYLAtomTypes,
356 TPSAAtomTypes, UFFAtomTypes\fR. Default value: \fIAtomicInvariantsAtomTypes\fR.
357 .ie n .IP "\fB\-\-AtomicInvariantsToUse\fR \fI""AtomicInvariant,AtomicInvariant...""\fR" 4
358 .el .IP "\fB\-\-AtomicInvariantsToUse\fR \fI``AtomicInvariant,AtomicInvariant...''\fR" 4
359 .IX Item "--AtomicInvariantsToUse AtomicInvariant,AtomicInvariant..."
360 This value is used during \fIAtomicInvariantsAtomTypes\fR value of \fBa, \-\-AtomIdentifierType\fR
361 option. It's a list of comma separated valid atomic invariant atom types.
362 .Sp
363 Possible values for atomic invariants are: \fI\s-1AS\s0, X, \s-1BO\s0, \s-1LBO\s0, \s-1SB\s0, \s-1DB\s0, \s-1TB\s0,
364 H, Ar, \s-1RA\s0, \s-1FC\s0, \s-1MN\s0, \s-1SM\s0\fR. Default value: \fI\s-1AS\s0,X,BO,H,FC\fR.
365 .Sp
366 The atomic invariants abbreviations correspond to:
367 .Sp
368 .Vb 1
369 \& AS = Atom symbol corresponding to element symbol
370 \&
371 \& X<n> = Number of non\-hydrogen atom neighbors or heavy atoms
372 \& BO<n> = Sum of bond orders to non\-hydrogen atom neighbors or heavy atoms
373 \& LBO<n> = Largest bond order of non\-hydrogen atom neighbors or heavy atoms
374 \& SB<n> = Number of single bonds to non\-hydrogen atom neighbors or heavy atoms
375 \& DB<n> = Number of double bonds to non\-hydrogen atom neighbors or heavy atoms
376 \& TB<n> = Number of triple bonds to non\-hydrogen atom neighbors or heavy atoms
377 \& H<n> = Number of implicit and explicit hydrogens for atom
378 \& Ar = Aromatic annotation indicating whether atom is aromatic
379 \& RA = Ring atom annotation indicating whether atom is a ring
380 \& FC<+n/\-n> = Formal charge assigned to atom
381 \& MN<n> = Mass number indicating isotope other than most abundant isotope
382 \& SM<n> = Spin multiplicity of atom. Possible values: 1 (singlet), 2 (doublet) or
383 \& 3 (triplet)
384 .Ve
385 .Sp
386 Atom type generated by AtomTypes::AtomicInvariantsAtomTypes class corresponds to:
387 .Sp
388 .Vb 1
389 \& AS.X<n>.BO<n>.LBO<n>.<SB><n>.<DB><n>.<TB><n>.H<n>.Ar.RA.FC<+n/\-n>.MN<n>.SM<n>
390 .Ve
391 .Sp
392 Except for \s-1AS\s0 which is a required atomic invariant in atom types, all other atomic invariants are
393 optional. Atom type specification doesn't include atomic invariants with zero or undefined values.
394 .Sp
395 In addition to usage of abbreviations for specifying atomic invariants, the following descriptive words
396 are also allowed:
397 .Sp
398 .Vb 12
399 \& X : NumOfNonHydrogenAtomNeighbors or NumOfHeavyAtomNeighbors
400 \& BO : SumOfBondOrdersToNonHydrogenAtoms or SumOfBondOrdersToHeavyAtoms
401 \& LBO : LargestBondOrderToNonHydrogenAtoms or LargestBondOrderToHeavyAtoms
402 \& SB : NumOfSingleBondsToNonHydrogenAtoms or NumOfSingleBondsToHeavyAtoms
403 \& DB : NumOfDoubleBondsToNonHydrogenAtoms or NumOfDoubleBondsToHeavyAtoms
404 \& TB : NumOfTripleBondsToNonHydrogenAtoms or NumOfTripleBondsToHeavyAtoms
405 \& H : NumOfImplicitAndExplicitHydrogens
406 \& Ar : Aromatic
407 \& RA : RingAtom
408 \& FC : FormalCharge
409 \& MN : MassNumber
410 \& SM : SpinMultiplicity
411 .Ve
412 .Sp
413 \&\fIAtomTypes::AtomicInvariantsAtomTypes\fR module is used to assign atomic invariant
414 atom types.
415 .ie n .IP "\fB\-\-FunctionalClassesToUse\fR \fI""FunctionalClass1,FunctionalClass2...""\fR" 4
416 .el .IP "\fB\-\-FunctionalClassesToUse\fR \fI``FunctionalClass1,FunctionalClass2...''\fR" 4
417 .IX Item "--FunctionalClassesToUse FunctionalClass1,FunctionalClass2..."
418 This value is used during \fIFunctionalClassAtomTypes\fR value of \fBa, \-\-AtomIdentifierType\fR
419 option. It's a list of comma separated valid functional classes.
420 .Sp
421 Possible values for atom functional classes are: \fIAr, \s-1CA\s0, H, \s-1HBA\s0, \s-1HBD\s0, Hal, \s-1NI\s0, \s-1PI\s0, \s-1RA\s0\fR.
422 Default value [ Ref 24 ]: \fI\s-1HBD\s0,HBA,PI,NI,Ar,Hal\fR.
423 .Sp
424 The functional class abbreviations correspond to:
425 .Sp
426 .Vb 9
427 \& HBD: HydrogenBondDonor
428 \& HBA: HydrogenBondAcceptor
429 \& PI : PositivelyIonizable
430 \& NI : NegativelyIonizable
431 \& Ar : Aromatic
432 \& Hal : Halogen
433 \& H : Hydrophobic
434 \& RA : RingAtom
435 \& CA : ChainAtom
436 \&
437 \& Functional class atom type specification for an atom corresponds to:
438 \&
439 \& Ar.CA.H.HBA.HBD.Hal.NI.PI.RA
440 .Ve
441 .Sp
442 \&\fIAtomTypes::FunctionalClassAtomTypes\fR module is used to assign functional class atom
443 types. It uses following definitions [ Ref 60\-61, Ref 65\-66 ]:
444 .Sp
445 .Vb 4
446 \& HydrogenBondDonor: NH, NH2, OH
447 \& HydrogenBondAcceptor: N[!H], O
448 \& PositivelyIonizable: +, NH2
449 \& NegativelyIonizable: \-, C(=O)OH, S(=O)OH, P(=O)OH
450 .Ve
451 .IP "\fB\-\-CompoundID\fR \fIDataFieldName or LabelPrefixString\fR" 4
452 .IX Item "--CompoundID DataFieldName or LabelPrefixString"
453 This value is \fB\-\-CompoundIDMode\fR specific and indicates how compound \s-1ID\s0 is generated.
454 .Sp
455 For \fIDataField\fR value of \fB\-\-CompoundIDMode\fR option, it corresponds to datafield label name
456 whose value is used as compound \s-1ID\s0; otherwise, it's a prefix string used for generating compound
457 IDs like LabelPrefixString<Number>. Default value, \fICmpd\fR, generates compound IDs which
458 look like Cmpd<Number>.
459 .Sp
460 Examples for \fIDataField\fR value of \fB\-\-CompoundIDMode\fR:
461 .Sp
462 .Vb 2
463 \& MolID
464 \& ExtReg
465 .Ve
466 .Sp
467 Examples for \fILabelPrefix\fR or \fIMolNameOrLabelPrefix\fR value of \fB\-\-CompoundIDMode\fR:
468 .Sp
469 .Vb 1
470 \& Compound
471 .Ve
472 .Sp
473 The value specified above generates compound IDs which correspond to Compound<Number>
474 instead of default value of Cmpd<Number>.
475 .IP "\fB\-\-CompoundIDLabel\fR \fItext\fR" 4
476 .IX Item "--CompoundIDLabel text"
477 Specify compound \s-1ID\s0 column label for \s-1CSV/TSV\s0 text file(s) used during \fICompoundID\fR value
478 of \fB\-\-DataFieldsMode\fR option. Default value: \fICompoundID\fR.
479 .IP "\fB\-\-CompoundIDMode\fR \fIDataField | MolName | LabelPrefix | MolNameOrLabelPrefix\fR" 4
480 .IX Item "--CompoundIDMode DataField | MolName | LabelPrefix | MolNameOrLabelPrefix"
481 Specify how to generate compound IDs and write to \s-1FP\s0 or \s-1CSV/TSV\s0 text file(s) along with generated
482 fingerprints for \fI\s-1FP\s0 | text | all\fR values of \fB\-\-output\fR option: use a \fISDFile(s)\fR datafield value;
483 use molname line from \fISDFile(s)\fR; generate a sequential \s-1ID\s0 with specific prefix; use combination
484 of both MolName and LabelPrefix with usage of LabelPrefix values for empty molname lines.
485 .Sp
486 Possible values: \fIDataField | MolName | LabelPrefix | MolNameOrLabelPrefix\fR.
487 Default value: \fILabelPrefix\fR.
488 .Sp
489 For \fIMolNameAndLabelPrefix\fR value of \fB\-\-CompoundIDMode\fR, molname line in \fISDFile(s)\fR takes
490 precedence over sequential compound IDs generated using \fILabelPrefix\fR and only empty molname
491 values are replaced with sequential compound IDs.
492 .Sp
493 This is only used for \fICompoundID\fR value of \fB\-\-DataFieldsMode\fR option.
494 .ie n .IP "\fB\-\-DataFields\fR \fI""FieldLabel1,FieldLabel2,...""\fR" 4
495 .el .IP "\fB\-\-DataFields\fR \fI``FieldLabel1,FieldLabel2,...''\fR" 4
496 .IX Item "--DataFields FieldLabel1,FieldLabel2,..."
497 Comma delimited list of \fISDFiles(s)\fR data fields to extract and write to \s-1CSV/TSV\s0 text file(s) along
498 with generated fingerprints for \fItext | all\fR values of \fB\-\-output\fR option.
499 .Sp
500 This is only used for \fISpecify\fR value of \fB\-\-DataFieldsMode\fR option.
501 .Sp
502 Examples:
503 .Sp
504 .Vb 2
505 \& Extreg
506 \& MolID,CompoundName
507 .Ve
508 .IP "\fB\-d, \-\-DataFieldsMode\fR \fIAll | Common | Specify | CompoundID\fR" 4
509 .IX Item "-d, --DataFieldsMode All | Common | Specify | CompoundID"
510 Specify how data fields in \fISDFile(s)\fR are transferred to output \s-1CSV/TSV\s0 text file(s) along
511 with generated fingerprints for \fItext | all\fR values of \fB\-\-output\fR option: transfer all \s-1SD\s0
512 data field; transfer \s-1SD\s0 data files common to all compounds; extract specified data fields;
513 generate a compound \s-1ID\s0 using molname line, a compound prefix, or a combination of both.
514 Possible values: \fIAll | Common | specify | CompoundID\fR. Default value: \fICompoundID\fR.
515 .IP "\fB\-f, \-\-Filter\fR \fIYes | No\fR" 4
516 .IX Item "-f, --Filter Yes | No"
517 Specify whether to check and filter compound data in SDFile(s). Possible values: \fIYes or No\fR.
518 Default value: \fIYes\fR.
519 .Sp
520 By default, compound data is checked before calculating fingerprints and compounds containing
521 atom data corresponding to non-element symbols or no atom data are ignored.
522 .IP "\fB\-\-FingerprintsLabel\fR \fItext\fR" 4
523 .IX Item "--FingerprintsLabel text"
524 \&\s-1SD\s0 data label or text file column label to use for fingerprints string in output \s-1SD\s0 or
525 \&\s-1CSV/TSV\s0 text file(s) specified by \fB\-\-output\fR. Default value: \fITopologicalAtomTripletsFingerprints\fR.
526 .IP "\fB\-h, \-\-help\fR" 4
527 .IX Item "-h, --help"
528 Print this help message.
529 .IP "\fB\-k, \-\-KeepLargestComponent\fR \fIYes | No\fR" 4
530 .IX Item "-k, --KeepLargestComponent Yes | No"
531 Generate fingerprints for only the largest component in molecule. Possible values:
532 \&\fIYes or No\fR. Default value: \fIYes\fR.
533 .Sp
534 For molecules containing multiple connected components, fingerprints can be generated
535 in two different ways: use all connected components or just the largest connected
536 component. By default, all atoms except for the largest connected component are
537 deleted before generation of fingerprints.
538 .IP "\fB\-\-MinDistance\fR \fInumber\fR" 4
539 .IX Item "--MinDistance number"
540 Minimum bond distance between atom triplets for generating topological atom triplets. Default value:
541 \&\fI1\fR. Valid values: positive integers and less than \fB\-\-MaxDistance\fR.
542 .IP "\fB\-\-MaxDistance\fR \fInumber\fR" 4
543 .IX Item "--MaxDistance number"
544 Maximum bond distance between atom triplets for generating topological atom triplets. Default value:
545 \&\fI10\fR. Valid values: positive integers and greater than \fB\-\-MinDistance\fR.
546 .IP "\fB\-\-OutDelim\fR \fIcomma | tab | semicolon\fR" 4
547 .IX Item "--OutDelim comma | tab | semicolon"
548 Delimiter for output \s-1CSV/TSV\s0 text file(s). Possible values: \fIcomma, tab, or semicolon\fR
549 Default value: \fIcomma\fR
550 .IP "\fB\-\-output\fR \fI\s-1SD\s0 | \s-1FP\s0 | text | all\fR" 4
551 .IX Item "--output SD | FP | text | all"
552 Type of output files to generate. Possible values: \fI\s-1SD\s0, \s-1FP\s0, text, or all\fR. Default value: \fItext\fR.
553 .IP "\fB\-o, \-\-overwrite\fR" 4
554 .IX Item "-o, --overwrite"
555 Overwrite existing files.
556 .IP "\fB\-q, \-\-quote\fR \fIYes | No\fR" 4
557 .IX Item "-q, --quote Yes | No"
558 Put quote around column values in output \s-1CSV/TSV\s0 text file(s). Possible values:
559 \&\fIYes or No\fR. Default value: \fIYes\fR.
560 .IP "\fB\-r, \-\-root\fR \fIRootName\fR" 4
561 .IX Item "-r, --root RootName"
562 New file name is generated using the root: <Root>.<Ext>. Default for new file names:
563 <SDFileName><TopologicalAtomTripletsFP>.<Ext>. The file type determines <Ext> value.
564 The sdf, fpf, csv, and tsv <Ext> values are used for \s-1SD\s0, \s-1FP\s0, comma/semicolon, and tab
565 delimited text files, respectively.This option is ignored for multiple input files.
566 .IP "\fB\-u, \-\-UseTriangleInequality\fR \fIYes | No\fR" 4
567 .IX Item "-u, --UseTriangleInequality Yes | No"
568 Specify whether to imply triangle distance inequality test to distances between atom pairs in
569 atom triplets during generation of atom triplets generation. Possible values: \fIYes or No\fR.
570 Default value: \fINo\fR.
571 .Sp
572 Triangle distance inequality test implies that distance or binned distance between any two atom
573 pairs in an atom triplet must be less than the sum of distances or binned distances between other
574 two atoms pairs and greater than the difference of their distances.
575 .Sp
576 .Vb 1
577 \& For atom triplet ATx\-Dyz\-ATy\-Dxz\-ATz\-Dxy to satisfy triangle inequality:
578 \&
579 \& Dyz > |Dxz \- Dxy| and Dyz < Dxz + Dxy
580 \& Dxz > |Dyz \- Dxy| and Dyz < Dyz + Dxy
581 \& Dxy > |Dyz \- Dxz| and Dxy < Dyz + Dxz
582 .Ve
583 .IP "\fB\-v, \-\-VectorStringFormat\fR \fIIDsAndValuesString | IDsAndValuesPairsString | ValuesAndIDsString | ValuesAndIDsPairsString\fR" 4
584 .IX Item "-v, --VectorStringFormat IDsAndValuesString | IDsAndValuesPairsString | ValuesAndIDsString | ValuesAndIDsPairsString"
585 Format of fingerprints vector string data in output \s-1SD\s0, \s-1FP\s0 or \s-1CSV/TSV\s0 text file(s) specified by
586 \&\fB\-\-output\fR option. Possible values: \fIIDsAndValuesString | IDsAndValuesPairsString | ValuesAndIDsString |
587 ValuesAndIDsPairsString\fR. Default value: \fIIDsAndValuesString\fR.
588 .Sp
589 Examples:
590 .Sp
591 .Vb 7
592 \& FingerprintsVector;TopologicalAtomTriplets:AtomicInvariantsAtomTypes:M
593 \& inDistance1:MaxDistance10;3096;NumericalValues;IDsAndValuesString;C.X1
594 \& .BO1.H3\-D1\-C.X1.BO1.H3\-D1\-C.X3.BO3.H1\-D2 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D1
595 \& 0\-C.X3.BO4\-D9 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D3\-N.X3.BO3\-D4 C.X1.BO1.H3\-D1
596 \& \-C.X2.BO2.H2\-D4\-C.X2.BO2.H2\-D5 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D6\-C.X3....;
597 \& 1 2 2 2 2 2 2 2 8 8 4 8 4 4 2 2 2 2 4 2 2 2 4 2 2 2 2 1 2 2 4 4 4 2 2
598 \& 2 4 4 4 8 4 4 2 4 4 4 2 4 4 2 2 2 2 2 2 2 2 1 2 2 2 2 2 2 2 2 2 2 8...
599 \&
600 \& FingerprintsVector;TopologicalAtomTriplets:AtomicInvariantsAtomTypes:M
601 \& inDistance1:MaxDistance10;3096;NumericalValues;IDsAndValuesPairsString
602 \& ;C.X1.BO1.H3\-D1\-C.X1.BO1.H3\-D1\-C.X3.BO3.H1\-D2 1 C.X1.BO1.H3\-D1\-C.X2.BO
603 \& 2.H2\-D10\-C.X3.BO4\-D9 2 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D3\-N.X3.BO3\-D4 2 C.X
604 \& 1.BO1.H3\-D1\-C.X2.BO2.H2\-D4\-C.X2.BO2.H2\-D5 2 C.X1.BO1.H3\-D1\-C.X2.BO2.H2
605 \& \-D6\-C.X3.BO3.H1\-D5 2 C.X1.BO1.H3\-D1\-C.X2.BO2.H2\-D6\-C.X3.BO3.H1\-D7 2...
606 .Ve
607 .IP "\fB\-w, \-\-WorkingDir\fR \fIDirName\fR" 4
608 .IX Item "-w, --WorkingDir DirName"
609 Location of working directory. Default value: current directory.
610 .SH "EXAMPLES"
611 .IX Header "EXAMPLES"
612 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
613 10 using atomic invariants atom types in IDsAndValuesString format and create a SampleTATFP.csv
614 file containing sequential compound IDs along with fingerprints vector strings data, type:
615 .PP
616 .Vb 1
617 \& % TopologicalAtomTripletsFingerprints.pl \-r SampleTATFP \-o Sample.sdf
618 .Ve
619 .PP
620 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
621 10 using atomic invariants atom types in IDsAndValuesString format and create SampleTATFP.sdf,
622 SampleTATFP.fpf and SampleTATFP.csv files containing sequential compound IDs in \s-1CSV\s0 file along
623 with fingerprints vector strings data, type:
624 .PP
625 .Vb 2
626 \& % TopologicalAtomTripletsFingerprints.pl \-\-output all \-r SampleTATFP
627 \& \-o Sample.sdf
628 .Ve
629 .PP
630 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
631 10 using atomic invariants atom types in IDsAndValuesPairsString format and create a SampleTATFP.csv
632 file containing sequential compound IDs along with fingerprints vector strings data, type:
633 .PP
634 .Vb 2
635 \& % TopologicalAtomTripletsFingerprints.pl \-\-VectorStringFormat
636 \& IDsAndValuesPairsString \-r SampleTATFP \-o Sample.sdf
637 .Ve
638 .PP
639 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
640 10 using \s-1DREIDING\s0 atom types in IDsAndValuesString format and create a SampleTATFP.csv
641 file containing sequential compound IDs along with fingerprints vector strings data, type:
642 .PP
643 .Vb 2
644 \& % TopologicalAtomTripletsFingerprints.pl \-a DREIDINGAtomTypes
645 \& \-r SampleTATFP \-o Sample.sdf
646 .Ve
647 .PP
648 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
649 10 using E\-state atom types in IDsAndValuesString format and create a SampleTATFP.csv
650 file containing sequential compound IDs along with fingerprints vector strings data, type:
651 .PP
652 .Vb 2
653 \& % TopologicalAtomTripletsFingerprints.pl \-a EStateAtomTypes
654 \& \-r SampleTATFP \-o Sample.sdf
655 .Ve
656 .PP
657 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
658 10 using functional class atom types in IDsAndValuesString format and create a SampleTATFP.csv
659 file containing sequential compound IDs along with fingerprints vector strings data, type:
660 .PP
661 .Vb 2
662 \& % TopologicalAtomTripletsFingerprints.pl \-a FunctionalClassAtomTypes
663 \& \-r SampleTATFP \-o Sample.sdf
664 .Ve
665 .PP
666 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
667 10 using \s-1DREIDING\s0 atom types in IDsAndValuesString format and create a SampleTATFP.csv
668 file containing sequential compound IDs along with fingerprints vector strings data, type:
669 .PP
670 .Vb 2
671 \& % TopologicalAtomTripletsFingerprints.pl \-a DREIDINGAtomTypes
672 \& \-r SampleTATFP \-o Sample.sdf
673 .Ve
674 .PP
675 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
676 10 using \s-1MM94\s0 atom types in IDsAndValuesString format and create a SampleTATFP.csv
677 file containing sequential compound IDs along with fingerprints vector strings data, type:
678 .PP
679 .Vb 2
680 \& % TopologicalAtomTripletsFingerprints.pl \-a MMFF94AtomTypes
681 \& \-r SampleTATFP \-o Sample.sdf
682 .Ve
683 .PP
684 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
685 10 using SLogP atom types in IDsAndValuesString format and create a SampleTATFP.csv
686 file containing sequential compound IDs along with fingerprints vector strings data, type:
687 .PP
688 .Vb 2
689 \& % TopologicalAtomTripletsFingerprints.pl \-a SLogPAtomTypes
690 \& \-r SampleTATFP \-o Sample.sdf
691 .Ve
692 .PP
693 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
694 10 using \s-1SYBYL\s0 atom types in IDsAndValuesString format and create a SampleTATFP.csv
695 file containing sequential compound IDs along with fingerprints vector strings data, type:
696 .PP
697 .Vb 2
698 \& % TopologicalAtomTripletsFingerprints.pl \-a SYBYLAtomTypes
699 \& \-r SampleTATFP \-o Sample.sdf
700 .Ve
701 .PP
702 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
703 10 using \s-1TPSA\s0 atom types in IDsAndValuesString format and create a SampleTATFP.csv
704 file containing sequential compound IDs along with fingerprints vector strings data, type:
705 .PP
706 .Vb 2
707 \& % TopologicalAtomTripletsFingerprints.pl \-a TPSAAtomTypes
708 \& \-r SampleTATFP \-o Sample.sdf
709 .Ve
710 .PP
711 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
712 10 using \s-1UFF\s0 atom types in IDsAndValuesString format and create a SampleTATFP.csv
713 file containing sequential compound IDs along with fingerprints vector strings data, type:
714 .PP
715 .Vb 2
716 \& % TopologicalAtomTripletsFingerprints.pl \-a UFFAtomTypes
717 \& \-r SampleTATFP \-o Sample.sdf
718 .Ve
719 .PP
720 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
721 6 using atomic invariants atom types in IDsAndValuesString format and create a SampleTATFP.csv
722 file containing sequential compound IDs along with fingerprints vector strings data, type:
723 .PP
724 .Vb 2
725 \& % TopologicalAtomTripletsFingerprints.pl \-a AtomicInvariantsAtomTypes
726 \& \-\-MinDistance 1 \-\-MaxDistance 6 \-r SampleTATFP \-o Sample.sdf
727 .Ve
728 .PP
729 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
730 10 using only \s-1AS\s0,X atomic invariants atom types in IDsAndValuesString format and create a
731 SampleTATFP.csv file containing sequential compound IDs along with fingerprints vector strings
732 data, type:
733 .PP
734 .Vb 3
735 \& % TopologicalAtomTripletsFingerprints.pl \-a AtomicInvariantsAtomTypes
736 \& \-\-AtomicInvariantsToUse "AS,X" \-\-MinDistance 1 \-\-MaxDistance 6
737 \& \-r SampleTATFP \-o Sample.sdf
738 .Ve
739 .PP
740 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
741 10 using atomic invariants atom types in IDsAndValuesString format and create a SampleTATFP.csv
742 file containing compound \s-1ID\s0 from molecule name line along with fingerprints vector strings
743 data, type:
744 .PP
745 .Vb 3
746 \& % TopologicalAtomTripletsFingerprints.pl \-a AtomicInvariantsAtomTypes
747 \& \-\-DataFieldsMode CompoundID \-CompoundIDMode MolName
748 \& \-r SampleTATFP \-o Sample.sdf
749 .Ve
750 .PP
751 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
752 10 using atomic invariants atom types in IDsAndValuesString format and create a SampleTATFP.csv
753 file containing compound IDs using specified data field along with fingerprints vector strings
754 data, type:
755 .PP
756 .Vb 3
757 \& % TopologicalAtomTripletsFingerprints.pl \-a AtomicInvariantsAtomTypes
758 \& \-\-DataFieldsMode CompoundID \-CompoundIDMode DataField \-\-CompoundID
759 \& Mol_ID \-r SampleTATFP \-o Sample.sdf
760 .Ve
761 .PP
762 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
763 10 using atomic invariants atom types in IDsAndValuesString format and create a SampleTATFP.csv
764 file containing compound \s-1ID\s0 using combination of molecule name line and an explicit compound
765 prefix along with fingerprints vector strings data, type:
766 .PP
767 .Vb 3
768 \& % TopologicalAtomTripletsFingerprints.pl \-a AtomicInvariantsAtomTypes
769 \& \-\-DataFieldsMode CompoundID \-CompoundIDMode MolnameOrLabelPrefix
770 \& \-\-CompoundID Cmpd \-\-CompoundIDLabel MolID \-r SampleTATFP \-o Sample.sdf
771 .Ve
772 .PP
773 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
774 10 using atomic invariants atom types in IDsAndValuesString format and create a SampleTATFP.csv
775 file containing specific data fields columns along with fingerprints vector strings
776 data, type:
777 .PP
778 .Vb 3
779 \& % TopologicalAtomTripletsFingerprints.pl \-a AtomicInvariantsAtomTypes
780 \& \-\-DataFieldsMode Specify \-\-DataFields Mol_ID \-r SampleTATFP
781 \& \-o Sample.sdf
782 .Ve
783 .PP
784 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
785 10 using atomic invariants atom types in IDsAndValuesString format and create a SampleTATFP.csv
786 file containing common data fields columns along with fingerprints vector strings
787 data, type:
788 .PP
789 .Vb 2
790 \& % TopologicalAtomTripletsFingerprints.pl \-a AtomicInvariantsAtomTypes
791 \& \-\-DataFieldsMode Common \-r SampleTATFP \-o Sample.sdf
792 .Ve
793 .PP
794 To generate topological atom triplets fingerprints corresponding to bond distances from 1 through
795 10 using atomic invariants atom types in IDsAndValuesString format and create SampleTATFP.sdf,
796 SampleTATFP.fpf and SampleTATFP.csv files containing all data fields columns in \s-1CSV\s0 file along with
797 fingerprints data, type:
798 .PP
799 .Vb 3
800 \& % TopologicalAtomTripletsFingerprints.pl \-a AtomicInvariantsAtomTypes
801 \& \-\-DataFieldsMode All \-\-output all \-r SampleTATFP
802 \& \-o Sample.sdf
803 .Ve
804 .SH "AUTHOR"
805 .IX Header "AUTHOR"
806 Manish Sud <msud@san.rr.com>
807 .SH "SEE ALSO"
808 .IX Header "SEE ALSO"
809 InfoFingerprintsFiles.pl, SimilarityMatricesFingerprints.pl, AtomNeighborhoodsFingerprints.pl,
810 ExtendedConnectivityFingerprints.pl, MACCSKeysFingerprints.pl,
811 PathLengthFingerprints.pl, TopologicalAtomTorsionsFingerprints.pl,
812 TopologicalPharmacophoreAtomPairsFingerprints.pl, TopologicalPharmacophoreAtomTripletsFingerprints.pl
813 .SH "COPYRIGHT"
814 .IX Header "COPYRIGHT"
815 Copyright (C) 2015 Manish Sud. All rights reserved.
816 .PP
817 This file is part of MayaChemTools.
818 .PP
819 MayaChemTools is free software; you can redistribute it and/or modify it under
820 the terms of the \s-1GNU\s0 Lesser General Public License as published by the Free
821 Software Foundation; either version 3 of the License, or (at your option)
822 any later version.