comparison docs/scripts/man1/AtomNeighborhoodsFingerprints.1 @ 0:4816e4a8ae95 draft default tip

Uploaded
author deepakjadmin
date Wed, 20 Jan 2016 09:23:18 -0500
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:4816e4a8ae95
1 .\" Automatically generated by Pod::Man 2.25 (Pod::Simple 3.22)
2 .\"
3 .\" Standard preamble:
4 .\" ========================================================================
5 .de Sp \" Vertical space (when we can't use .PP)
6 .if t .sp .5v
7 .if n .sp
8 ..
9 .de Vb \" Begin verbatim text
10 .ft CW
11 .nf
12 .ne \\$1
13 ..
14 .de Ve \" End verbatim text
15 .ft R
16 .fi
17 ..
18 .\" Set up some character translations and predefined strings. \*(-- will
19 .\" give an unbreakable dash, \*(PI will give pi, \*(L" will give a left
20 .\" double quote, and \*(R" will give a right double quote. \*(C+ will
21 .\" give a nicer C++. Capital omega is used to do unbreakable dashes and
22 .\" therefore won't be available. \*(C` and \*(C' expand to `' in nroff,
23 .\" nothing in troff, for use with C<>.
24 .tr \(*W-
25 .ds C+ C\v'-.1v'\h'-1p'\s-2+\h'-1p'+\s0\v'.1v'\h'-1p'
26 .ie n \{\
27 . ds -- \(*W-
28 . ds PI pi
29 . if (\n(.H=4u)&(1m=24u) .ds -- \(*W\h'-12u'\(*W\h'-12u'-\" diablo 10 pitch
30 . if (\n(.H=4u)&(1m=20u) .ds -- \(*W\h'-12u'\(*W\h'-8u'-\" diablo 12 pitch
31 . ds L" ""
32 . ds R" ""
33 . ds C` ""
34 . ds C' ""
35 'br\}
36 .el\{\
37 . ds -- \|\(em\|
38 . ds PI \(*p
39 . ds L" ``
40 . ds R" ''
41 'br\}
42 .\"
43 .\" Escape single quotes in literal strings from groff's Unicode transform.
44 .ie \n(.g .ds Aq \(aq
45 .el .ds Aq '
46 .\"
47 .\" If the F register is turned on, we'll generate index entries on stderr for
48 .\" titles (.TH), headers (.SH), subsections (.SS), items (.Ip), and index
49 .\" entries marked with X<> in POD. Of course, you'll have to process the
50 .\" output yourself in some meaningful fashion.
51 .ie \nF \{\
52 . de IX
53 . tm Index:\\$1\t\\n%\t"\\$2"
54 ..
55 . nr % 0
56 . rr F
57 .\}
58 .el \{\
59 . de IX
60 ..
61 .\}
62 .\"
63 .\" Accent mark definitions (@(#)ms.acc 1.5 88/02/08 SMI; from UCB 4.2).
64 .\" Fear. Run. Save yourself. No user-serviceable parts.
65 . \" fudge factors for nroff and troff
66 .if n \{\
67 . ds #H 0
68 . ds #V .8m
69 . ds #F .3m
70 . ds #[ \f1
71 . ds #] \fP
72 .\}
73 .if t \{\
74 . ds #H ((1u-(\\\\n(.fu%2u))*.13m)
75 . ds #V .6m
76 . ds #F 0
77 . ds #[ \&
78 . ds #] \&
79 .\}
80 . \" simple accents for nroff and troff
81 .if n \{\
82 . ds ' \&
83 . ds ` \&
84 . ds ^ \&
85 . ds , \&
86 . ds ~ ~
87 . ds /
88 .\}
89 .if t \{\
90 . ds ' \\k:\h'-(\\n(.wu*8/10-\*(#H)'\'\h"|\\n:u"
91 . ds ` \\k:\h'-(\\n(.wu*8/10-\*(#H)'\`\h'|\\n:u'
92 . ds ^ \\k:\h'-(\\n(.wu*10/11-\*(#H)'^\h'|\\n:u'
93 . ds , \\k:\h'-(\\n(.wu*8/10)',\h'|\\n:u'
94 . ds ~ \\k:\h'-(\\n(.wu-\*(#H-.1m)'~\h'|\\n:u'
95 . ds / \\k:\h'-(\\n(.wu*8/10-\*(#H)'\z\(sl\h'|\\n:u'
96 .\}
97 . \" troff and (daisy-wheel) nroff accents
98 .ds : \\k:\h'-(\\n(.wu*8/10-\*(#H+.1m+\*(#F)'\v'-\*(#V'\z.\h'.2m+\*(#F'.\h'|\\n:u'\v'\*(#V'
99 .ds 8 \h'\*(#H'\(*b\h'-\*(#H'
100 .ds o \\k:\h'-(\\n(.wu+\w'\(de'u-\*(#H)/2u'\v'-.3n'\*(#[\z\(de\v'.3n'\h'|\\n:u'\*(#]
101 .ds d- \h'\*(#H'\(pd\h'-\w'~'u'\v'-.25m'\f2\(hy\fP\v'.25m'\h'-\*(#H'
102 .ds D- D\\k:\h'-\w'D'u'\v'-.11m'\z\(hy\v'.11m'\h'|\\n:u'
103 .ds th \*(#[\v'.3m'\s+1I\s-1\v'-.3m'\h'-(\w'I'u*2/3)'\s-1o\s+1\*(#]
104 .ds Th \*(#[\s+2I\s-2\h'-\w'I'u*3/5'\v'-.3m'o\v'.3m'\*(#]
105 .ds ae a\h'-(\w'a'u*4/10)'e
106 .ds Ae A\h'-(\w'A'u*4/10)'E
107 . \" corrections for vroff
108 .if v .ds ~ \\k:\h'-(\\n(.wu*9/10-\*(#H)'\s-2\u~\d\s+2\h'|\\n:u'
109 .if v .ds ^ \\k:\h'-(\\n(.wu*10/11-\*(#H)'\v'-.4m'^\v'.4m'\h'|\\n:u'
110 . \" for low resolution devices (crt and lpr)
111 .if \n(.H>23 .if \n(.V>19 \
112 \{\
113 . ds : e
114 . ds 8 ss
115 . ds o a
116 . ds d- d\h'-1'\(ga
117 . ds D- D\h'-1'\(hy
118 . ds th \o'bp'
119 . ds Th \o'LP'
120 . ds ae ae
121 . ds Ae AE
122 .\}
123 .rm #[ #] #H #V #F C
124 .\" ========================================================================
125 .\"
126 .IX Title "ATOMNEIGHBORHOODSFINGERPRINTS 1"
127 .TH ATOMNEIGHBORHOODSFINGERPRINTS 1 "2015-03-29" "perl v5.14.2" "MayaChemTools"
128 .\" For nroff, turn off justification. Always turn off hyphenation; it makes
129 .\" way too many mistakes in technical documents.
130 .if n .ad l
131 .nh
132 .SH "NAME"
133 AtomNeighborhoodsFingerprints.pl \- Generate atom neighborhoods fingerprints for SD files
134 .SH "SYNOPSIS"
135 .IX Header "SYNOPSIS"
136 AtomNeighborhoodsFingerprints.pl SDFile(s)...
137 .PP
138 AtomNeighborhoodsFingerprints.pl [\fB\-\-AromaticityModel\fR \fIAromaticityModelType\fR]
139 [\fB\-a, \-\-AtomIdentifierType\fR \fIAtomicInvariantsAtomTypes |
140 DREIDINGAtomTypes | EStateAtomTypes | MMFF94AtomTypes | SLogPAtomTypes | SYBYLAtomTypes | TPSAAtomTypes | UFFAtomTypes\fR]
141 [\fB\-\-AtomicInvariantsToUse\fR \fI\*(L"AtomicInvariant,AtomicInvariant...\*(R"\fR]
142 [\fB\-\-FunctionalClassesToUse\fR \fI\*(L"FunctionalClass1,FunctionalClass2...\*(R"\fR]
143 [\fB\-\-CompoundID\fR \fIDataFieldName or LabelPrefixString\fR] [\fB\-\-CompoundIDLabel\fR \fItext\fR]
144 [\fB\-\-CompoundIDMode\fR] [\fB\-\-DataFields\fR \fI\*(L"FieldLabel1,FieldLabel2,...\*(R"\fR]
145 [\fB\-d, \-\-DataFieldsMode\fR \fIAll | Common | Specify | CompoundID\fR] [\fB\-f, \-\-Filter\fR \fIYes | No\fR]
146 [\fB\-\-FingerprintsLabel\fR \fItext\fR] [\fB\-h, \-\-help\fR] [\fB\-k, \-\-KeepLargestComponent\fR \fIYes | No\fR]
147 [\fB\-\-MinNeighborhoodRadius\fR \fInumber\fR] [\fB\-\-MaxNeighborhoodRadius\fR \fInumber\fR]
148 [\fB\-\-OutDelim\fR \fIcomma | tab | semicolon\fR] [\fB\-\-output\fR \fI\s-1SD\s0 | \s-1FP\s0 | text | all\fR] [\fB\-o, \-\-overwrite\fR]
149 [\fB\-q, \-\-quote\fR \fIYes | No\fR] [\fB\-r, \-\-root\fR \fIRootName\fR]
150 [\fB\-w, \-\-WorkingDir\fR dirname] SDFile(s)...
151 .SH "DESCRIPTION"
152 .IX Header "DESCRIPTION"
153 Generate atom neighborhoods fingerprints [ Ref 53\-56, Ref 73 ] for \fISDFile(s)\fR and create appropriate
154 \&\s-1SD\s0, \s-1FP\s0 or \s-1CSV/TSV\s0 text file(s) containing fingerprints vector strings corresponding to molecular fingerprints.
155 .PP
156 Multiple SDFile names are separated by spaces. The valid file extensions are \fI.sdf\fR
157 and \fI.sd\fR. All other file names are ignored. All the \s-1SD\s0 files in a current directory
158 can be specified either by \fI*.sdf\fR or the current directory name.
159 .PP
160 The current release of MayaChemTools supports generation of atom neighborhoods fingerprints
161 corresponding to following \fB\-a, \-\-AtomIdentifierTypes\fR:
162 .PP
163 .Vb 3
164 \& AtomicInvariantsAtomTypes, DREIDINGAtomTypes, EStateAtomTypes,
165 \& FunctionalClassAtomTypes, MMFF94AtomTypes, SLogPAtomTypes,
166 \& SYBYLAtomTypes, TPSAAtomTypes, UFFAtomTypes
167 .Ve
168 .PP
169 Based on the values specified for \fB\-a, \-\-AtomIdentifierType\fR and \fB\-\-AtomicInvariantsToUse\fR,
170 initial atom types are assigned to all non-hydrogen atoms in a molecule. Using atom neighborhoods
171 around each non-hydrogen central atom corresponding to radii between specified values
172 \&\fB\-\-MinNeighborhoodRadius\fR and \fB\-\-MaxNeighborhoodRadius\fR, unique atom types at
173 each radii level are counted and an atom neighborhood identifier is generated.
174 .PP
175 The format of an atom neighborhood identifier around a central non-hydrogen atom at a
176 specific radius is:
177 .PP
178 .Vb 1
179 \& NR<n>\-<AtomType>\-ATC<n>
180 \&
181 \& NR: Neighborhood radius
182 \& AtomType: Assigned atom type
183 \& ATC: Atom type count
184 .Ve
185 .PP
186 The atom neighborhood identifier for a non-hydrogen central atom corresponding to all specified radii
187 is generated by concatenating neighborhood identifiers at each radii by colon as a delimiter:
188 .PP
189 .Vb 1
190 \& NR<n>\-<AtomType>\-ATC<n>:NR<n>\-<AtomType>\-ATC<n>:...
191 .Ve
192 .PP
193 The atom neighborhood identifiers for all non-hydrogen central atoms at all specified radii are
194 concatenated using space as a delimiter and constitute atom neighborhood fingerprint of the molecule.
195 .PP
196 Example of \fI\s-1SD\s0\fR file containing atom neighborhood fingerprints string data:
197 .PP
198 .Vb 10
199 \& ... ...
200 \& ... ...
201 \& $$$$
202 \& ... ...
203 \& ... ...
204 \& ... ...
205 \& 41 44 0 0 0 0 0 0 0 0999 V2000
206 \& \-3.3652 1.4499 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
207 \& ... ...
208 \& 2 3 1 0 0 0 0
209 \& ... ...
210 \& M END
211 \& > <CmpdID>
212 \& Cmpd1
213 \&
214 \& > <AtomNeighborhoodsFingerprints>
215 \& FingerprintsVector;AtomNeighborhoods:AtomicInvariantsAtomTypes:MinRadiu
216 \& s0:MaxRadius2;41;AlphaNumericalValues;ValuesString;NR0\-C.X1.BO1.H3\-ATC1
217 \& :NR1\-C.X3.BO3.H1\-ATC1:NR2\-C.X1.BO1.H3\-ATC1:NR2\-C.X3.BO4\-ATC1 NR0\-C.X1.B
218 \& O1.H3\-ATC1:NR1\-C.X3.BO3.H1\-ATC1:NR2\-C.X1.BO1.H3\-ATC1:NR2\-C.X3.BO4\-ATC1
219 \& NR0\-C.X2.BO2.H2\-ATC1:NR1\-C.X2.BO2.H2\-ATC1:NR1\-C.X3.BO3.H1\-ATC1:NR2\-C...
220 \&
221 \& $$$$
222 \& ... ...
223 \& ... ...
224 .Ve
225 .PP
226 Example of \fI\s-1FP\s0\fR file containing atom neighborhood fingerprints string data:
227 .PP
228 .Vb 10
229 \& #
230 \& # Package = MayaChemTools 7.4
231 \& # Release Date = Oct 21, 2010
232 \& #
233 \& # TimeStamp = Fri Mar 11 14:15:27 2011
234 \& #
235 \& # FingerprintsStringType = FingerprintsVector
236 \& #
237 \& # Description = AtomNeighborhoods:AtomicInvariantsAtomTypes:MinRadiu...
238 \& # VectorStringFormat = ValuesString
239 \& # VectorValuesType = AlphaNumericalValues
240 \& #
241 \& Cmpd1 41;NR0\-C.X1.BO1.H3\-ATC1:NR1\-C.X3.BO3.H1\-ATC1:NR2\-C.X1.BO1.H3\-A...
242 \& Cmpd2 23;NR0\-C.X1.BO1.H3\-ATC1:NR1\-C.X2.BO2.H2\-ATC1:NR2\-C.X3.BO3.H1\-A...
243 \& ... ...
244 \& ... ..
245 .Ve
246 .PP
247 Example of \s-1CSV\s0 \fIText\fR file containing atom neighborhood fingerprints string data:
248 .PP
249 .Vb 8
250 \& "CompoundID","AtomNeighborhoodsFingerprints"
251 \& "Cmpd1","FingerprintsVector;AtomNeighborhoods:AtomicInvariantsAtomTypes
252 \& :MinRadius0:MaxRadius2;41;AlphaNumericalValues;ValuesString;NR0\-C.X1.B
253 \& O1.H3\-ATC1:NR1\-C.X3.BO3.H1\-ATC1:NR2\-C.X1.BO1.H3\-ATC1:NR2\-C.X3.BO4\-ATC1
254 \& NR0\-C.X1.BO1.H3\-ATC1:NR1\-C.X3.BO3.H1\-ATC1:NR2\-C.X1.BO1.H3\-ATC1:NR2\-C.X3
255 \& .BO4\-ATC1 NR0\-C.X2.BO2.H2\-ATC1:NR1\-C.X2.BO2.H2\-ATC1:NR1\-C.X3.BO3.H1..."
256 \& ... ...
257 \& ... ...
258 .Ve
259 .PP
260 The current release of MayaChemTools generates the following types of atom neighborhoods
261 fingerprints vector strings:
262 .PP
263 .Vb 6
264 \& FingerprintsVector;AtomNeighborhoods:AtomicInvariantsAtomTypes:MinRadi
265 \& us0:MaxRadius2;41;AlphaNumericalValues;ValuesString;NR0\-C.X1.BO1.H3\-AT
266 \& C1:NR1\-C.X3.BO3.H1\-ATC1:NR2\-C.X1.BO1.H3\-ATC1:NR2\-C.X3.BO4\-ATC1 NR0\-C.X
267 \& 1.BO1.H3\-ATC1:NR1\-C.X3.BO3.H1\-ATC1:NR2\-C.X1.BO1.H3\-ATC1:NR2\-C.X3.BO4\-A
268 \& TC1 NR0\-C.X2.BO2.H2\-ATC1:NR1\-C.X2.BO2.H2\-ATC1:NR1\-C.X3.BO3.H1\-ATC1:NR2
269 \& \-C.X2.BO2.H2\-ATC1:NR2\-N.X3.BO3\-ATC1:NR2\-O.X1.BO1.H1\-ATC1 NR0\-C.X2.B...
270 \&
271 \& FingerprintsVector;AtomNeighborhoods:DREIDINGAtomTypes:MinRadius0:MaxR
272 \& adius2;41;AlphaNumericalValues;ValuesString;NR0\-C_2\-ATC1:NR1\-C_3\-ATC1:
273 \& NR1\-O_2\-ATC1:NR1\-O_3\-ATC1:NR2\-C_3\-ATC1 NR0\-C_2\-ATC1:NR1\-C_R\-ATC1:NR1\-N
274 \& _3\-ATC1:NR1\-O_2\-ATC1:NR2\-C_R\-ATC3 NR0\-C_3\-ATC1:NR1\-C_2\-ATC1:NR1\-C_3\-AT
275 \& C1:NR2\-C_3\-ATC1:NR2\-O_2\-ATC1:NR2\-O_3\-ATC2 NR0\-C_3\-ATC1:NR1\-C_3\-ATC1:NR
276 \& 1\-N_R\-ATC1:NR2\-C_3\-ATC1:NR2\-C_R\-ATC2 NR0\-C_3\-ATC1:NR1\-C_3\-ATC1:NR2\-...
277 \&
278 \& FingerprintsVector;AtomNeighborhoods:EStateAtomTypes:MinRadius0:MaxRad
279 \& ius2;41;AlphaNumericalValues;ValuesString;NR0\-aaCH\-ATC1:NR1\-aaCH\-ATC1:
280 \& NR1\-aasC\-ATC1:NR2\-aaCH\-ATC1:NR2\-aasC\-ATC1:NR2\-sF\-ATC1 NR0\-aaCH\-ATC1:NR
281 \& 1\-aaCH\-ATC1:NR1\-aasC\-ATC1:NR2\-aaCH\-ATC1:NR2\-aasC\-ATC1:NR2\-sF\-ATC1 NR0\-
282 \& aaCH\-ATC1:NR1\-aaCH\-ATC1:NR1\-aasC\-ATC1:NR2\-aaCH\-ATC1:NR2\-aasC\-ATC2 NR0\-
283 \& aaCH\-ATC1:NR1\-aaCH\-ATC1:NR1\-aasC\-ATC1:NR2\-aaCH\-ATC1:NR2\-aasC\-ATC2 N...
284 \&
285 \& FingerprintsVector;AtomNeighborhoods:FunctionalClassAtomTypes:MinRadiu
286 \& s0:MaxRadius2;41;AlphaNumericalValues;ValuesString;NR0\-Ar\-ATC1:NR1\-Ar\-
287 \& ATC1:NR1\-Ar.HBA\-ATC1:NR1\-None\-ATC1:NR2\-Ar\-ATC2:NR2\-None\-ATC4 NR0\-Ar\-AT
288 \& C1:NR1\-Ar\-ATC2:NR1\-Ar.HBA\-ATC1:NR2\-Ar\-ATC5:NR2\-None\-ATC1 NR0\-Ar\-ATC1:N
289 \& R1\-Ar\-ATC2:NR1\-HBD\-ATC1:NR2\-Ar\-ATC2:NR2\-None\-ATC1 NR0\-Ar\-ATC1:NR1\-Ar\-A
290 \& TC2:NR1\-Hal\-ATC1:NR2\-Ar\-ATC2 NR0\-Ar\-ATC1:NR1\-Ar\-ATC2:NR1\-None\-ATC1:...
291 \&
292 \& FingerprintsVector;AtomNeighborhoods:MMFF94AtomTypes:MinRadius0:MaxRad
293 \& ius2;41;AlphaNumericalValues;ValuesString;NR0\-C5A\-ATC1:NR1\-C5B\-ATC1:NR
294 \& 1\-CB\-ATC1:NR1\-N5\-ATC1:NR2\-C5A\-ATC1:NR2\-C5B\-ATC1:NR2\-CB\-ATC3:NR2\-CR\-ATC
295 \& 1 NR0\-C5A\-ATC1:NR1\-C5B\-ATC1:NR1\-CR\-ATC1:NR1\-N5\-ATC1:NR2\-C5A\-ATC1:NR2\-C
296 \& 5B\-ATC1:NR2\-C=ON\-ATC1:NR2\-CR\-ATC3 NR0\-C5B\-ATC1:NR1\-C5A\-ATC1:NR1\-C5B\-AT
297 \& C1:NR1\-C=ON\-ATC1:NR2\-C5A\-ATC1:NR2\-CB\-ATC1:NR2\-CR\-ATC1:NR2\-N5\-ATC1:N...
298 \&
299 \& FingerprintsVector;AtomNeighborhoods:SLogPAtomTypes:MinRadius0:MaxRadi
300 \& us2;41;AlphaNumericalValues;ValuesString;NR0\-C1\-ATC1:NR1\-C10\-ATC1:NR1\-
301 \& CS\-ATC1:NR2\-C1\-ATC1:NR2\-N11\-ATC1:NR2\-O2\-ATC1 NR0\-C1\-ATC1:NR1\-C11\-ATC1:
302 \& NR2\-C1\-ATC1:NR2\-C21\-ATC1 NR0\-C1\-ATC1:NR1\-C11\-ATC1:NR2\-C1\-ATC1:NR2\-C21\-
303 \& ATC1 NR0\-C1\-ATC1:NR1\-C5\-ATC1:NR1\-CS\-ATC1:NR2\-C1\-ATC1:NR2\-O2\-ATC2:NR2\-O
304 \& 9\-ATC1 NR0\-C1\-ATC1:NR1\-CS\-ATC2:NR2\-C1\-ATC2:NR2\-O2\-ATC2 NR0\-C10\-ATC1...
305 \&
306 \& FingerprintsVector;AtomNeighborhoods:SYBYLAtomTypes:MinRadius0:MaxRadi
307 \& us2;41;AlphaNumericalValues;ValuesString;NR0\-C.2\-ATC1:NR1\-C.3\-ATC1:NR1
308 \& \-O.co2\-ATC2:NR2\-C.3\-ATC1 NR0\-C.2\-ATC1:NR1\-C.ar\-ATC1:NR1\-N.am\-ATC1:NR1\-
309 \& O.2\-ATC1:NR2\-C.ar\-ATC3 NR0\-C.3\-ATC1:NR1\-C.2\-ATC1:NR1\-C.3\-ATC1:NR2\-C.3\-
310 \& ATC1:NR2\-O.3\-ATC1:NR2\-O.co2\-ATC2 NR0\-C.3\-ATC1:NR1\-C.3\-ATC1:NR1\-N.ar\-AT
311 \& C1:NR2\-C.3\-ATC1:NR2\-C.ar\-ATC2 NR0\-C.3\-ATC1:NR1\-C.3\-ATC1:NR2\-C.3\-ATC...
312 \&
313 \& FingerprintsVector;AtomNeighborhoods:TPSAAtomTypes:MinRadius0:MaxRadiu
314 \& s2;41;AlphaNumericalValues;ValuesString;NR0\-N21\-ATC1:NR1\-None\-ATC3:NR2
315 \& \-None\-ATC5 NR0\-N7\-ATC1:NR1\-None\-ATC2:NR2\-None\-ATC3:NR2\-O3\-ATC1 NR0\-Non
316 \& e\-ATC1:NR1\-N21\-ATC1:NR1\-None\-ATC1:NR2\-None\-ATC3 NR0\-None\-ATC1:NR1\-N21\-
317 \& ATC1:NR1\-None\-ATC2:NR2\-None\-ATC6 NR0\-None\-ATC1:NR1\-N21\-ATC1:NR1\-None\-A
318 \& TC2:NR2\-None\-ATC6 NR0\-None\-ATC1:NR1\-N7\-ATC1:NR1\-None\-ATC1:NR1\-O3\-AT...
319 \&
320 \& FingerprintsVector;AtomNeighborhoods:UFFAtomTypes:MinRadius0:MaxRadius
321 \& 2;41;AlphaNumericalValues;ValuesString;NR0\-C_2\-ATC1:NR1\-C_3\-ATC1:NR1\-O
322 \& _2\-ATC1:NR1\-O_3\-ATC1:NR2\-C_3\-ATC1 NR0\-C_2\-ATC1:NR1\-C_R\-ATC1:NR1\-N_3\-AT
323 \& C1:NR1\-O_2\-ATC1:NR2\-C_R\-ATC3 NR0\-C_3\-ATC1:NR1\-C_2\-ATC1:NR1\-C_3\-ATC1:NR
324 \& 2\-C_3\-ATC1:NR2\-O_2\-ATC1:NR2\-O_3\-ATC2 NR0\-C_3\-ATC1:NR1\-C_3\-ATC1:NR1\-N_R
325 \& \-ATC1:NR2\-C_3\-ATC1:NR2\-C_R\-ATC2 NR0\-C_3\-ATC1:NR1\-C_3\-ATC1:NR2\-C_3\-A...
326 .Ve
327 .SH "OPTIONS"
328 .IX Header "OPTIONS"
329 .IP "\fB\-\-AromaticityModel\fR \fIMDLAromaticityModel | TriposAromaticityModel | MMFFAromaticityModel | ChemAxonBasicAromaticityModel | ChemAxonGeneralAromaticityModel | DaylightAromaticityModel | MayaChemToolsAromaticityModel\fR" 4
330 .IX Item "--AromaticityModel MDLAromaticityModel | TriposAromaticityModel | MMFFAromaticityModel | ChemAxonBasicAromaticityModel | ChemAxonGeneralAromaticityModel | DaylightAromaticityModel | MayaChemToolsAromaticityModel"
331 Specify aromaticity model to use during detection of aromaticity. Possible values in the current
332 release are: \fIMDLAromaticityModel, TriposAromaticityModel, MMFFAromaticityModel,
333 ChemAxonBasicAromaticityModel, ChemAxonGeneralAromaticityModel, DaylightAromaticityModel
334 or MayaChemToolsAromaticityModel\fR. Default value: \fIMayaChemToolsAromaticityModel\fR.
335 .Sp
336 The supported aromaticity model names along with model specific control parameters
337 are defined in \fBAromaticityModelsData.csv\fR, which is distributed with the current release
338 and is available under \fBlib/data\fR directory. \fBMolecule.pm\fR module retrieves data from
339 this file during class instantiation and makes it available to method \fBDetectAromaticity\fR
340 for detecting aromaticity corresponding to a specific model.
341 .IP "\fB\-a, \-\-AtomIdentifierType\fR \fIAtomicInvariantsAtomTypes | DREIDINGAtomTypes | EStateAtomTypes | FunctionalClassAtomTypes | MMFF94AtomTypes | SLogPAtomTypes | SYBYLAtomTypes | TPSAAtomTypes | UFFAtomTypes\fR" 4
342 .IX Item "-a, --AtomIdentifierType AtomicInvariantsAtomTypes | DREIDINGAtomTypes | EStateAtomTypes | FunctionalClassAtomTypes | MMFF94AtomTypes | SLogPAtomTypes | SYBYLAtomTypes | TPSAAtomTypes | UFFAtomTypes"
343 Specify atom identifier type to use for assignment of initial atom identifier to non-hydrogen
344 atoms during calculation of atom neighborhoods fingerprints. Possible values in the current
345 release are: \fIAtomicInvariantsAtomTypes, DREIDINGAtomTypes, EStateAtomTypes,
346 FunctionalClassAtomTypes, MMFF94AtomTypes, SLogPAtomTypes, SYBYLAtomTypes,
347 TPSAAtomTypes, UFFAtomTypes\fR. Default value: \fIAtomicInvariantsAtomTypes\fR.
348 .ie n .IP "\fB\-\-AtomicInvariantsToUse\fR \fI""AtomicInvariant,AtomicInvariant...""\fR" 4
349 .el .IP "\fB\-\-AtomicInvariantsToUse\fR \fI``AtomicInvariant,AtomicInvariant...''\fR" 4
350 .IX Item "--AtomicInvariantsToUse AtomicInvariant,AtomicInvariant..."
351 This value is used during \fIAtomicInvariantsAtomTypes\fR value of \fBa, \-\-AtomIdentifierType\fR
352 option. It's a list of comma separated valid atomic invariant atom types.
353 .Sp
354 Possible values for atomic invariants are: \fI\s-1AS\s0, X, \s-1BO\s0, \s-1LBO\s0, \s-1SB\s0, \s-1DB\s0, \s-1TB\s0,
355 H, Ar, \s-1RA\s0, \s-1FC\s0, \s-1MN\s0, \s-1SM\s0\fR. Default value: \fI\s-1AS\s0,X,BO,H,FC\fR.
356 .Sp
357 The atomic invariants abbreviations correspond to:
358 .Sp
359 .Vb 1
360 \& AS = Atom symbol corresponding to element symbol
361 \&
362 \& X<n> = Number of non\-hydrogen atom neighbors or heavy atoms
363 \& BO<n> = Sum of bond orders to non\-hydrogen atom neighbors or heavy atoms
364 \& LBO<n> = Largest bond order of non\-hydrogen atom neighbors or heavy atoms
365 \& SB<n> = Number of single bonds to non\-hydrogen atom neighbors or heavy atoms
366 \& DB<n> = Number of double bonds to non\-hydrogen atom neighbors or heavy atoms
367 \& TB<n> = Number of triple bonds to non\-hydrogen atom neighbors or heavy atoms
368 \& H<n> = Number of implicit and explicit hydrogens for atom
369 \& Ar = Aromatic annotation indicating whether atom is aromatic
370 \& RA = Ring atom annotation indicating whether atom is a ring
371 \& FC<+n/\-n> = Formal charge assigned to atom
372 \& MN<n> = Mass number indicating isotope other than most abundant isotope
373 \& SM<n> = Spin multiplicity of atom. Possible values: 1 (singlet), 2 (doublet) or
374 \& 3 (triplet)
375 .Ve
376 .Sp
377 Atom type generated by AtomTypes::AtomicInvariantsAtomTypes class corresponds to:
378 .Sp
379 .Vb 1
380 \& AS.X<n>.BO<n>.LBO<n>.<SB><n>.<DB><n>.<TB><n>.H<n>.Ar.RA.FC<+n/\-n>.MN<n>.SM<n>
381 .Ve
382 .Sp
383 Except for \s-1AS\s0 which is a required atomic invariant in atom types, all other atomic invariants are
384 optional. Atom type specification doesn't include atomic invariants with zero or undefined values.
385 .Sp
386 In addition to usage of abbreviations for specifying atomic invariants, the following descriptive words
387 are also allowed:
388 .Sp
389 .Vb 12
390 \& X : NumOfNonHydrogenAtomNeighbors or NumOfHeavyAtomNeighbors
391 \& BO : SumOfBondOrdersToNonHydrogenAtoms or SumOfBondOrdersToHeavyAtoms
392 \& LBO : LargestBondOrderToNonHydrogenAtoms or LargestBondOrderToHeavyAtoms
393 \& SB : NumOfSingleBondsToNonHydrogenAtoms or NumOfSingleBondsToHeavyAtoms
394 \& DB : NumOfDoubleBondsToNonHydrogenAtoms or NumOfDoubleBondsToHeavyAtoms
395 \& TB : NumOfTripleBondsToNonHydrogenAtoms or NumOfTripleBondsToHeavyAtoms
396 \& H : NumOfImplicitAndExplicitHydrogens
397 \& Ar : Aromatic
398 \& RA : RingAtom
399 \& FC : FormalCharge
400 \& MN : MassNumber
401 \& SM : SpinMultiplicity
402 .Ve
403 .Sp
404 \&\fIAtomTypes::AtomicInvariantsAtomTypes\fR module is used to assign atomic invariant
405 atom types.
406 .ie n .IP "\fB\-\-FunctionalClassesToUse\fR \fI""FunctionalClass1,FunctionalClass2...""\fR" 4
407 .el .IP "\fB\-\-FunctionalClassesToUse\fR \fI``FunctionalClass1,FunctionalClass2...''\fR" 4
408 .IX Item "--FunctionalClassesToUse FunctionalClass1,FunctionalClass2..."
409 This value is used during \fIFunctionalClassAtomTypes\fR value of \fBa, \-\-AtomIdentifierType\fR
410 option. It's a list of comma separated valid functional classes.
411 .Sp
412 Possible values for atom functional classes are: \fIAr, \s-1CA\s0, H, \s-1HBA\s0, \s-1HBD\s0, Hal, \s-1NI\s0, \s-1PI\s0, \s-1RA\s0\fR.
413 Default value [ Ref 24 ]: \fI\s-1HBD\s0,HBA,PI,NI,Ar,Hal\fR.
414 .Sp
415 The functional class abbreviations correspond to:
416 .Sp
417 .Vb 9
418 \& HBD: HydrogenBondDonor
419 \& HBA: HydrogenBondAcceptor
420 \& PI : PositivelyIonizable
421 \& NI : NegativelyIonizable
422 \& Ar : Aromatic
423 \& Hal : Halogen
424 \& H : Hydrophobic
425 \& RA : RingAtom
426 \& CA : ChainAtom
427 \&
428 \& Functional class atom type specification for an atom corresponds to:
429 \&
430 \& Ar.CA.H.HBA.HBD.Hal.NI.PI.RA
431 .Ve
432 .Sp
433 \&\fIAtomTypes::FunctionalClassAtomTypes\fR module is used to assign functional class atom
434 types. It uses following definitions [ Ref 60\-61, Ref 65\-66 ]:
435 .Sp
436 .Vb 4
437 \& HydrogenBondDonor: NH, NH2, OH
438 \& HydrogenBondAcceptor: N[!H], O
439 \& PositivelyIonizable: +, NH2
440 \& NegativelyIonizable: \-, C(=O)OH, S(=O)OH, P(=O)OH
441 .Ve
442 .IP "\fB\-\-CompoundID\fR \fIDataFieldName or LabelPrefixString\fR" 4
443 .IX Item "--CompoundID DataFieldName or LabelPrefixString"
444 This value is \fB\-\-CompoundIDMode\fR specific and indicates how compound \s-1ID\s0 is generated.
445 .Sp
446 For \fIDataField\fR value of \fB\-\-CompoundIDMode\fR option, it corresponds to datafield label name
447 whose value is used as compound \s-1ID\s0; otherwise, it's a prefix string used for generating compound
448 IDs like LabelPrefixString<Number>. Default value, \fICmpd\fR, generates compound IDs which
449 look like Cmpd<Number>.
450 .Sp
451 Examples for \fIDataField\fR value of \fB\-\-CompoundIDMode\fR:
452 .Sp
453 .Vb 2
454 \& MolID
455 \& ExtReg
456 .Ve
457 .Sp
458 Examples for \fILabelPrefix\fR or \fIMolNameOrLabelPrefix\fR value of \fB\-\-CompoundIDMode\fR:
459 .Sp
460 .Vb 1
461 \& Compound
462 .Ve
463 .Sp
464 The value specified above generates compound IDs which correspond to Compound<Number>
465 instead of default value of Cmpd<Number>.
466 .IP "\fB\-\-CompoundIDLabel\fR \fItext\fR" 4
467 .IX Item "--CompoundIDLabel text"
468 Specify compound \s-1ID\s0 column label for \s-1FP\s0 or \s-1CSV/TSV\s0 text file(s) used during \fICompoundID\fR value
469 of \fB\-\-DataFieldsMode\fR option. Default: \fICompoundID\fR.
470 .IP "\fB\-\-CompoundIDMode\fR \fIDataField | MolName | LabelPrefix | MolNameOrLabelPrefix\fR" 4
471 .IX Item "--CompoundIDMode DataField | MolName | LabelPrefix | MolNameOrLabelPrefix"
472 Specify how to generate compound IDs and write to \s-1FP\s0 or \s-1CSV/TSV\s0 text file(s) along with generated
473 fingerprints for \fI\s-1FP\s0 | text | all\fR values of \fB\-\-output\fR option: use a \fISDFile(s)\fR datafield value;
474 use molname line from \fISDFile(s)\fR; generate a sequential \s-1ID\s0 with specific prefix; use combination
475 of both MolName and LabelPrefix with usage of LabelPrefix values for empty molname lines.
476 .Sp
477 Possible values: \fIDataField | MolName | LabelPrefix | MolNameOrLabelPrefix\fR.
478 Default: \fILabelPrefix\fR.
479 .Sp
480 For \fIMolNameAndLabelPrefix\fR value of \fB\-\-CompoundIDMode\fR, molname line in \fISDFile(s)\fR takes
481 precedence over sequential compound IDs generated using \fILabelPrefix\fR and only empty molname
482 values are replaced with sequential compound IDs.
483 .Sp
484 This is only used for \fICompoundID\fR value of \fB\-\-DataFieldsMode\fR option.
485 .ie n .IP "\fB\-\-DataFields\fR \fI""FieldLabel1,FieldLabel2,...""\fR" 4
486 .el .IP "\fB\-\-DataFields\fR \fI``FieldLabel1,FieldLabel2,...''\fR" 4
487 .IX Item "--DataFields FieldLabel1,FieldLabel2,..."
488 Comma delimited list of \fISDFiles(s)\fR data fields to extract and write to \s-1CSV/TSV\s0 text file(s) along
489 with generated fingerprints for \fItext | all\fR values of \fB\-\-output\fR option.
490 .Sp
491 This is only used for \fISpecify\fR value of \fB\-\-DataFieldsMode\fR option.
492 .Sp
493 Examples:
494 .Sp
495 .Vb 2
496 \& Extreg
497 \& MolID,CompoundName
498 .Ve
499 .IP "\fB\-d, \-\-DataFieldsMode\fR \fIAll | Common | Specify | CompoundID\fR" 4
500 .IX Item "-d, --DataFieldsMode All | Common | Specify | CompoundID"
501 Specify how data fields in \fISDFile(s)\fR are transferred to output \s-1CSV/TSV\s0 text file(s) along
502 with generated fingerprints for \fItext | all\fR values of \fB\-\-output\fR option: transfer all \s-1SD\s0
503 data field; transfer \s-1SD\s0 data files common to all compounds; extract specified data fields;
504 generate a compound \s-1ID\s0 using molname line, a compound prefix, or a combination of both.
505 Possible values: \fIAll | Common | specify | CompoundID\fR. Default value: \fICompoundID\fR.
506 .IP "\fB\-f, \-\-Filter\fR \fIYes | No\fR" 4
507 .IX Item "-f, --Filter Yes | No"
508 Specify whether to check and filter compound data in SDFile(s). Possible values: \fIYes or No\fR.
509 Default value: \fIYes\fR.
510 .Sp
511 By default, compound data is checked before calculating fingerprints and compounds containing
512 atom data corresponding to non-element symbols or no atom data are ignored.
513 .IP "\fB\-\-FingerprintsLabel\fR \fItext\fR" 4
514 .IX Item "--FingerprintsLabel text"
515 \&\s-1SD\s0 data label or text file column label to use for fingerprints string in output \s-1SD\s0 or
516 \&\s-1CSV/TSV\s0 text file(s) specified by \fB\-\-output\fR. Default value: \fIAtomNeighborhoodsFingerprints\fR.
517 .IP "\fB\-h, \-\-help\fR" 4
518 .IX Item "-h, --help"
519 Print this help message.
520 .IP "\fB\-k, \-\-KeepLargestComponent\fR \fIYes | No\fR" 4
521 .IX Item "-k, --KeepLargestComponent Yes | No"
522 Generate fingerprints for only the largest component in molecule. Possible values:
523 \&\fIYes or No\fR. Default value: \fIYes\fR.
524 .Sp
525 For molecules containing multiple connected components, fingerprints can be generated
526 in two different ways: use all connected components or just the largest connected
527 component. By default, all atoms except for the largest connected component are
528 deleted before generation of fingerprints.
529 .IP "\fB\-\-MinNeighborhoodRadius\fR \fInumber\fR" 4
530 .IX Item "--MinNeighborhoodRadius number"
531 Minimum atom neighborhood radius for generating atom neighborhoods. Default value: \fI0\fR.
532 Valid values: positive integers and less than \fB\-\-MaxNeighborhoodRadius\fR. Neighborhood
533 radius of zero corresponds to list of non-hydrogen atoms.
534 .IP "\fB\-\-MaxNeighborhoodRadius\fR \fInumber\fR" 4
535 .IX Item "--MaxNeighborhoodRadius number"
536 Maximum atom neighborhood radius for generating atom neighborhoods. Default value: \fI2\fR.
537 Valid values: positive integers and greater than \fB\-\-MineighborhoodRadius\fR.
538 .IP "\fB\-\-OutDelim\fR \fIcomma | tab | semicolon\fR" 4
539 .IX Item "--OutDelim comma | tab | semicolon"
540 Delimiter for output \s-1CSV/TSV\s0 text file(s). Possible values: \fIcomma, tab, or semicolon\fR
541 Default value: \fIcomma\fR.
542 .IP "\fB\-\-output\fR \fI\s-1SD\s0 | \s-1FP\s0 | text | all\fR" 4
543 .IX Item "--output SD | FP | text | all"
544 Type of output files to generate. Possible values: \fI\s-1SD\s0, \s-1FP\s0, text, or all\fR. Default value: \fItext\fR.
545 .IP "\fB\-o, \-\-overwrite\fR" 4
546 .IX Item "-o, --overwrite"
547 Overwrite existing files.
548 .IP "\fB\-q, \-\-quote\fR \fIYes | No\fR" 4
549 .IX Item "-q, --quote Yes | No"
550 Put quote around column values in output \s-1CSV/TSV\s0 text file(s). Possible values:
551 \&\fIYes or No\fR. Default value: \fIYes\fR.
552 .IP "\fB\-r, \-\-root\fR \fIRootName\fR" 4
553 .IX Item "-r, --root RootName"
554 New file name is generated using the root: <Root>.<Ext>. Default for new file names:
555 <SDFileName><AtomNeighborhoodsFP>.<Ext>. The file type determines <Ext>
556 value. The sdf, fpf, csv, and tsv <Ext> values are used for \s-1SD\s0, comma/semicolon, and tab
557 delimited text files, respectively.This option is ignored for multiple input files.
558 .IP "\fB\-w, \-\-WorkingDir\fR \fIDirName\fR" 4
559 .IX Item "-w, --WorkingDir DirName"
560 Location of working directory. Default: current directory.
561 .SH "EXAMPLES"
562 .IX Header "EXAMPLES"
563 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
564 2 using atomic invariants atom types in vector string format and create a SampleANFP.csv
565 file containing sequential compound IDs along with fingerprints vector strings data, type:
566 .PP
567 .Vb 1
568 \& % AtomNeighborhoodsFingerprints.pl \-r SampleANFP \-o Sample.sdf
569 .Ve
570 .PP
571 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
572 2 using \s-1DREIDING\s0 atom types in vector string format and create a SampleANFP.csv
573 file containing sequential compound IDs along with fingerprints vector strings data, type:
574 .PP
575 .Vb 2
576 \& % AtomNeighborhoodsFingerprints.pl \-a DREIDINGAtomTypes \-r SampleANFP
577 \& \-o Sample.sdf
578 .Ve
579 .PP
580 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
581 2 using EStateAtomTypes types in vector string format and create a SampleANFP.csv
582 file containing sequential compound IDs along with fingerprints vector strings data, type:
583 .PP
584 .Vb 2
585 \& % AtomNeighborhoodsFingerprints.pl \-a EStateAtomTypes \-r SampleANFP
586 \& \-o Sample.sdf
587 .Ve
588 .PP
589 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
590 2 using \s-1SYBYL\s0 atom types in vector string format and create a SampleANFP.csv
591 file containing sequential compound IDs along with fingerprints vector strings data, type:
592 .PP
593 .Vb 2
594 \& % AtomNeighborhoodsFingerprints.pl \-a SYBYLAtomTypes \-r SampleANFP
595 \& \-o Sample.sdf
596 .Ve
597 .PP
598 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
599 2 using FunctionalClass atom types in vector string format and create a SampleANFP.csv
600 file containing sequential compound IDs along with fingerprints vector strings data, type:
601 .PP
602 .Vb 2
603 \& % AtomNeighborhoodsFingerprints.pl \-a FunctionalClassAtomTypes
604 \& \-r SampleANFP \-o Sample.sdf
605 .Ve
606 .PP
607 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
608 2 using \s-1MMFF94\s0 atom types in vector string format and create a SampleANFP.csv
609 file containing sequential compound IDs along with fingerprints vector strings data, type:
610 .PP
611 .Vb 2
612 \& % AtomNeighborhoodsFingerprints.pl \-a MMFF94AtomTypes \-r SampleANFP
613 \& \-o Sample.sdf
614 .Ve
615 .PP
616 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
617 2 using SLogP atom types in vector string format and create a SampleANFP.csv
618 file containing sequential compound IDs along with fingerprints vector strings data, type:
619 .PP
620 .Vb 2
621 \& % AtomNeighborhoodsFingerprints.pl \-a SLogPAtomTypes \-r SampleANFP
622 \& \-o Sample.sdf
623 .Ve
624 .PP
625 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
626 2 using \s-1SYBYL\s0 atom types in vector string format and create a SampleANFP.csv
627 file containing sequential compound IDs along with fingerprints vector strings data, type:
628 .PP
629 .Vb 2
630 \& % AtomNeighborhoodsFingerprints.pl \-a SYBYLAtomTypes \-r SampleANFP
631 \& \-o Sample.sdf
632 .Ve
633 .PP
634 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
635 2 using \s-1TPSA\s0 atom types in vector string format and create a SampleANFP.csv
636 file containing sequential compound IDs along with fingerprints vector strings data, type:
637 .PP
638 .Vb 2
639 \& % AtomNeighborhoodsFingerprints.pl \-a TPSAAtomTypes \-r SampleANFP
640 \& \-o Sample.sdf
641 .Ve
642 .PP
643 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
644 2 using \s-1UFF\s0 atom types in vector string format and create a SampleANFP.csv
645 file containing sequential compound IDs along with fingerprints vector strings data, type:
646 .PP
647 .Vb 2
648 \& % AtomNeighborhoodsFingerprints.pl \-a UFFAtomTypes \-r SampleANFP
649 \& \-o Sample.sdf
650 .Ve
651 .PP
652 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
653 2 using atomic invariants atom types in vector string format and create SampleANFP.sdf,
654 SampleANFP.fpf and SampleANFP.csv files containing sequential compound IDs in \s-1CSV\s0 file along
655 with fingerprints vector strings data, type:
656 .PP
657 .Vb 2
658 \& % AtomNeighborhoodsFingerprints.pl \-\-output all \-r SampleANFP
659 \& \-o Sample.sdf
660 .Ve
661 .PP
662 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 1 to
663 3 using atomic invariants atom types in vector string format and create a SampleANFP.csv
664 file containing sequential compound IDs along with fingerprints vector strings data, type:
665 .PP
666 .Vb 3
667 \& % AtomNeighborhoodsFingerprints.pl \-a AtomicInvariantsAtomTypes
668 \& \-\-MinNeighborhoodRadius 1 \-\-MaxNeighborhoodRadius 3 \-r SampleANFP
669 \& \-o Sample.sdf
670 .Ve
671 .PP
672 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
673 2 using only \s-1AS\s0,X atomic invariants atom types in vector string format and create a SampleANFP.csv
674 file containing sequential compound IDs along with fingerprints vector strings data, type:
675 .PP
676 .Vb 3
677 \& % AtomNeighborhoodsFingerprints.pl \-a AtomicInvariantsAtomTypes
678 \& \-\-AtomicInvariantsToUse "AS,X" \-\-MinNeighborhoodRadius 0
679 \& \-\-MaxNeighborhoodRadius 3 \-r SampleANFP \-o Sample.sdf
680 .Ve
681 .PP
682 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
683 2 using atomic invariants atom types in vector string format and create a SampleANFP.csv
684 file containing compound \s-1ID\s0 from molecule name line along with fingerprints vector strings data, type:
685 .PP
686 .Vb 3
687 \& % AtomNeighborhoodsFingerprints.pl \-a AtomicInvariantsAtomTypes
688 \& \-\-DataFieldsMode CompoundID \-\-CompoundIDMode MolName
689 \& \-r SampleANFP \-o Sample.sdf
690 .Ve
691 .PP
692 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
693 2 using atomic invariants atom types in vector string format and create a SampleANFP.csv
694 file containing compound IDs using specified data field along with fingerprints vector strings
695 data, type:
696 .PP
697 .Vb 3
698 \& % AtomNeighborhoodsFingerprints.pl \-a AtomicInvariantsAtomTypes
699 \& \-\-DataFieldsMode CompoundID \-\-CompoundIDMode DataField \-\-CompoundID
700 \& Mol_ID \-r SampleANFP \-o Sample.sdf
701 .Ve
702 .PP
703 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
704 2 using atomic invariants atom types in vector string format and create a SampleANFP.csv
705 file containing compound \s-1ID\s0 using combination of molecule name line and an explicit compound
706 prefix along with fingerprints vector strings data, type:
707 .PP
708 .Vb 3
709 \& % AtomNeighborhoodsFingerprints.pl \-a AtomicInvariantsAtomTypes
710 \& \-\-DataFieldsMode CompoundID \-\-CompoundIDMode MolnameOrLabelPrefix
711 \& \-\-CompoundID Cmpd \-\-CompoundIDLabel MolID \-r SampleANFP \-o Sample.sdf
712 .Ve
713 .PP
714 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
715 2 using atomic invariants atom types in vector string format and create a SampleANFP.csv
716 file containing specific data fields columns along with fingerprints vector strings
717 data, type:
718 .PP
719 .Vb 3
720 \& % AtomNeighborhoodsFingerprints.pl \-a AtomicInvariantsAtomTypes
721 \& \-\-DataFieldsMode Specify \-\-DataFields Mol_ID \-r SampleANFP
722 \& \-o Sample.sdf
723 .Ve
724 .PP
725 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
726 2 using atomic invariants atom types in vector string format and create a SampleANFP.csv
727 file containing common data fields columns along with fingerprints vector strings
728 data, type:
729 .PP
730 .Vb 2
731 \& % AtomNeighborhoodsFingerprints.pl \-a AtomicInvariantsAtomTypes
732 \& \-\-DataFieldsMode Common \-r SampleANFP \-o Sample.sdf
733 .Ve
734 .PP
735 To generate atom neighborhoods fingerprints corresponding to atom neighborhood radii from 0 to
736 2 using atomic invariants atom types in vector string format and create SampleANFP.sdf,
737 SampleANFP.fpf and SampleANFP.csv files containing all data fields columns in \s-1CSV\s0 file along with
738 fingerprints data, type:
739 .PP
740 .Vb 3
741 \& % AtomNeighborhoodsFingerprints.pl \-a AtomicInvariantsAtomTypes
742 \& \-\-DataFieldsMode All \-\-output all \-r SampleANFP
743 \& \-o Sample.sdf
744 .Ve
745 .SH "AUTHOR"
746 .IX Header "AUTHOR"
747 Manish Sud <msud@san.rr.com>
748 .SH "SEE ALSO"
749 .IX Header "SEE ALSO"
750 InfoFingerprintsFiles.pl, SimilarityMatricesFingerprints.pl, SimilaritySearchingFingerprints.pl,
751 ExtendedConnectivityFingerprints.pl, MACCSKeysFingerprints.pl, PathLengthFingerprints.pl,
752 TopologicalAtomPairsFingerprints.pl, TopologicalAtomTorsionsFingerprints.pl,
753 TopologicalPharmacophoreAtomPairsFingerprints.pl, TopologicalPharmacophoreAtomTripletsFingerprints.pl
754 .SH "COPYRIGHT"
755 .IX Header "COPYRIGHT"
756 Copyright (C) 2015 Manish Sud. All rights reserved.
757 .PP
758 This file is part of MayaChemTools.
759 .PP
760 MayaChemTools is free software; you can redistribute it and/or modify it under
761 the terms of the \s-1GNU\s0 Lesser General Public License as published by the Free
762 Software Foundation; either version 3 of the License, or (at your option)
763 any later version.