Mercurial > repos > deepakjadmin > mayatool3_test2
comparison docs/scripts/man1/CalculatePhysicochemicalProperties.1 @ 0:4816e4a8ae95 draft default tip
Uploaded
| author | deepakjadmin |
|---|---|
| date | Wed, 20 Jan 2016 09:23:18 -0500 |
| parents | |
| children |
comparison
equal
deleted
inserted
replaced
| -1:000000000000 | 0:4816e4a8ae95 |
|---|---|
| 1 .\" Automatically generated by Pod::Man 2.25 (Pod::Simple 3.22) | |
| 2 .\" | |
| 3 .\" Standard preamble: | |
| 4 .\" ======================================================================== | |
| 5 .de Sp \" Vertical space (when we can't use .PP) | |
| 6 .if t .sp .5v | |
| 7 .if n .sp | |
| 8 .. | |
| 9 .de Vb \" Begin verbatim text | |
| 10 .ft CW | |
| 11 .nf | |
| 12 .ne \\$1 | |
| 13 .. | |
| 14 .de Ve \" End verbatim text | |
| 15 .ft R | |
| 16 .fi | |
| 17 .. | |
| 18 .\" Set up some character translations and predefined strings. \*(-- will | |
| 19 .\" give an unbreakable dash, \*(PI will give pi, \*(L" will give a left | |
| 20 .\" double quote, and \*(R" will give a right double quote. \*(C+ will | |
| 21 .\" give a nicer C++. Capital omega is used to do unbreakable dashes and | |
| 22 .\" therefore won't be available. \*(C` and \*(C' expand to `' in nroff, | |
| 23 .\" nothing in troff, for use with C<>. | |
| 24 .tr \(*W- | |
| 25 .ds C+ C\v'-.1v'\h'-1p'\s-2+\h'-1p'+\s0\v'.1v'\h'-1p' | |
| 26 .ie n \{\ | |
| 27 . ds -- \(*W- | |
| 28 . ds PI pi | |
| 29 . if (\n(.H=4u)&(1m=24u) .ds -- \(*W\h'-12u'\(*W\h'-12u'-\" diablo 10 pitch | |
| 30 . if (\n(.H=4u)&(1m=20u) .ds -- \(*W\h'-12u'\(*W\h'-8u'-\" diablo 12 pitch | |
| 31 . ds L" "" | |
| 32 . ds R" "" | |
| 33 . ds C` "" | |
| 34 . ds C' "" | |
| 35 'br\} | |
| 36 .el\{\ | |
| 37 . ds -- \|\(em\| | |
| 38 . ds PI \(*p | |
| 39 . ds L" `` | |
| 40 . ds R" '' | |
| 41 'br\} | |
| 42 .\" | |
| 43 .\" Escape single quotes in literal strings from groff's Unicode transform. | |
| 44 .ie \n(.g .ds Aq \(aq | |
| 45 .el .ds Aq ' | |
| 46 .\" | |
| 47 .\" If the F register is turned on, we'll generate index entries on stderr for | |
| 48 .\" titles (.TH), headers (.SH), subsections (.SS), items (.Ip), and index | |
| 49 .\" entries marked with X<> in POD. Of course, you'll have to process the | |
| 50 .\" output yourself in some meaningful fashion. | |
| 51 .ie \nF \{\ | |
| 52 . de IX | |
| 53 . tm Index:\\$1\t\\n%\t"\\$2" | |
| 54 .. | |
| 55 . nr % 0 | |
| 56 . rr F | |
| 57 .\} | |
| 58 .el \{\ | |
| 59 . de IX | |
| 60 .. | |
| 61 .\} | |
| 62 .\" | |
| 63 .\" Accent mark definitions (@(#)ms.acc 1.5 88/02/08 SMI; from UCB 4.2). | |
| 64 .\" Fear. Run. Save yourself. No user-serviceable parts. | |
| 65 . \" fudge factors for nroff and troff | |
| 66 .if n \{\ | |
| 67 . ds #H 0 | |
| 68 . ds #V .8m | |
| 69 . ds #F .3m | |
| 70 . ds #[ \f1 | |
| 71 . ds #] \fP | |
| 72 .\} | |
| 73 .if t \{\ | |
| 74 . ds #H ((1u-(\\\\n(.fu%2u))*.13m) | |
| 75 . ds #V .6m | |
| 76 . ds #F 0 | |
| 77 . ds #[ \& | |
| 78 . ds #] \& | |
| 79 .\} | |
| 80 . \" simple accents for nroff and troff | |
| 81 .if n \{\ | |
| 82 . ds ' \& | |
| 83 . ds ` \& | |
| 84 . ds ^ \& | |
| 85 . ds , \& | |
| 86 . ds ~ ~ | |
| 87 . ds / | |
| 88 .\} | |
| 89 .if t \{\ | |
| 90 . ds ' \\k:\h'-(\\n(.wu*8/10-\*(#H)'\'\h"|\\n:u" | |
| 91 . ds ` \\k:\h'-(\\n(.wu*8/10-\*(#H)'\`\h'|\\n:u' | |
| 92 . ds ^ \\k:\h'-(\\n(.wu*10/11-\*(#H)'^\h'|\\n:u' | |
| 93 . ds , \\k:\h'-(\\n(.wu*8/10)',\h'|\\n:u' | |
| 94 . ds ~ \\k:\h'-(\\n(.wu-\*(#H-.1m)'~\h'|\\n:u' | |
| 95 . ds / \\k:\h'-(\\n(.wu*8/10-\*(#H)'\z\(sl\h'|\\n:u' | |
| 96 .\} | |
| 97 . \" troff and (daisy-wheel) nroff accents | |
| 98 .ds : \\k:\h'-(\\n(.wu*8/10-\*(#H+.1m+\*(#F)'\v'-\*(#V'\z.\h'.2m+\*(#F'.\h'|\\n:u'\v'\*(#V' | |
| 99 .ds 8 \h'\*(#H'\(*b\h'-\*(#H' | |
| 100 .ds o \\k:\h'-(\\n(.wu+\w'\(de'u-\*(#H)/2u'\v'-.3n'\*(#[\z\(de\v'.3n'\h'|\\n:u'\*(#] | |
| 101 .ds d- \h'\*(#H'\(pd\h'-\w'~'u'\v'-.25m'\f2\(hy\fP\v'.25m'\h'-\*(#H' | |
| 102 .ds D- D\\k:\h'-\w'D'u'\v'-.11m'\z\(hy\v'.11m'\h'|\\n:u' | |
| 103 .ds th \*(#[\v'.3m'\s+1I\s-1\v'-.3m'\h'-(\w'I'u*2/3)'\s-1o\s+1\*(#] | |
| 104 .ds Th \*(#[\s+2I\s-2\h'-\w'I'u*3/5'\v'-.3m'o\v'.3m'\*(#] | |
| 105 .ds ae a\h'-(\w'a'u*4/10)'e | |
| 106 .ds Ae A\h'-(\w'A'u*4/10)'E | |
| 107 . \" corrections for vroff | |
| 108 .if v .ds ~ \\k:\h'-(\\n(.wu*9/10-\*(#H)'\s-2\u~\d\s+2\h'|\\n:u' | |
| 109 .if v .ds ^ \\k:\h'-(\\n(.wu*10/11-\*(#H)'\v'-.4m'^\v'.4m'\h'|\\n:u' | |
| 110 . \" for low resolution devices (crt and lpr) | |
| 111 .if \n(.H>23 .if \n(.V>19 \ | |
| 112 \{\ | |
| 113 . ds : e | |
| 114 . ds 8 ss | |
| 115 . ds o a | |
| 116 . ds d- d\h'-1'\(ga | |
| 117 . ds D- D\h'-1'\(hy | |
| 118 . ds th \o'bp' | |
| 119 . ds Th \o'LP' | |
| 120 . ds ae ae | |
| 121 . ds Ae AE | |
| 122 .\} | |
| 123 .rm #[ #] #H #V #F C | |
| 124 .\" ======================================================================== | |
| 125 .\" | |
| 126 .IX Title "CALCULATEPHYSICOCHEMICALPROPERTIES 1" | |
| 127 .TH CALCULATEPHYSICOCHEMICALPROPERTIES 1 "2015-03-29" "perl v5.14.2" "MayaChemTools" | |
| 128 .\" For nroff, turn off justification. Always turn off hyphenation; it makes | |
| 129 .\" way too many mistakes in technical documents. | |
| 130 .if n .ad l | |
| 131 .nh | |
| 132 .SH "NAME" | |
| 133 CalculatePhysicochemicalProperties.pl \- Calculate physicochemical properties for SD files | |
| 134 .SH "SYNOPSIS" | |
| 135 .IX Header "SYNOPSIS" | |
| 136 CalculatePhysicochemicalProperties.pl SDFile(s)... | |
| 137 .PP | |
| 138 PhysicochemicalProperties.pl [\fB\-\-AromaticityModel\fR \fIAromaticityModelType\fR] | |
| 139 [\fB\-\-CompoundID\fR DataFieldName or LabelPrefixString] | |
| 140 [\fB\-\-CompoundIDLabel\fR text] [\fB\-\-CompoundIDMode\fR] [\fB\-\-DataFields\fR \*(L"FieldLabel1, FieldLabel2,...\*(R"] | |
| 141 [\fB\-d, \-\-DataFieldsMode\fR All | Common | Specify | CompoundID] [\fB\-f, \-\-Filter\fR Yes | No] [\fB\-h, \-\-help\fR] | |
| 142 [\fB\-\-HydrogenBonds\fR HBondsType1 | HBondsType2] [\fB\-k, \-\-KeepLargestComponent\fR Yes | No] | |
| 143 [\fB\-m, \-\-mode\fR All | RuleOf5 | RuleOf3 | \*(L"name1, [name2,...]\*(R"] | |
| 144 [\fB\-\-MolecularComplexity\fR \fIName,Value, [Name,Value,...]\fR] | |
| 145 [\fB\-\-OutDelim\fR comma | tab | semicolon] [\fB\-\-output\fR \s-1SD\s0 | text | both] [\fB\-o, \-\-overwrite\fR] | |
| 146 [\fB\-\-Precision\fR Name,Number,[Name,Number,..]] [\fB\-\-RotatableBonds\fR Name,Value, [Name,Value,...]] | |
| 147 [\fB\-\-RuleOf3Violations\fR Yes | No] [\fB\-\-RuleOf5Violations\fR Yes | No] | |
| 148 [\fB\-q, \-\-quote\fR Yes | No] [\fB\-r, \-\-root\fR RootName] | |
| 149 [\fB\-w, \-\-WorkingDir\fR dirname] SDFile(s)... | |
| 150 .SH "DESCRIPTION" | |
| 151 .IX Header "DESCRIPTION" | |
| 152 Calculate physicochemical properties for \fISDFile(s)\fR and create appropriate \s-1SD\s0 or \s-1CSV/TSV\s0 | |
| 153 text file(s) containing calculated properties. | |
| 154 .PP | |
| 155 The current release of MayaChemTools supports the calculation of these physicochemical | |
| 156 properties: | |
| 157 .PP | |
| 158 .Vb 7 | |
| 159 \& MolecularWeight, ExactMass, HeavyAtoms, Rings, AromaticRings, | |
| 160 \& van der Waals MolecularVolume [ Ref 93 ], RotatableBonds, | |
| 161 \& HydrogenBondDonors, HydrogenBondAcceptors, LogP and | |
| 162 \& Molar Refractivity (SLogP and SMR) [ Ref 89 ], Topological Polar | |
| 163 \& Surface Area (TPSA) [ Ref 90 ], Fraction of SP3 carbons (Fsp3Carbons) | |
| 164 \& and SP3 carbons (Sp3Carbons) [ Ref 115\-116, Ref 119 ], | |
| 165 \& MolecularComplexity [ Ref 117\-119 ] | |
| 166 .Ve | |
| 167 .PP | |
| 168 Multiple SDFile names are separated by spaces. The valid file extensions are \fI.sdf\fR | |
| 169 and \fI.sd\fR. All other file names are ignored. All the \s-1SD\s0 files in a current directory | |
| 170 can be specified either by \fI*.sdf\fR or the current directory name. | |
| 171 .PP | |
| 172 The calculation of molecular complexity using \fIMolecularComplexityType\fR parameter | |
| 173 corresponds to the number of bits-set or unique keys [ Ref 117\-119 ] in molecular fingerprints. | |
| 174 Default value for \fIMolecularComplexityType\fR: \fIMACCSKeys\fR of size 166. The calculation | |
| 175 of MACCSKeys is relatively expensive and can take rather substantial amount of time. | |
| 176 .SH "OPTIONS" | |
| 177 .IX Header "OPTIONS" | |
| 178 .IP "\fB\-\-AromaticityModel\fR \fIMDLAromaticityModel | TriposAromaticityModel | MMFFAromaticityModel | ChemAxonBasicAromaticityModel | ChemAxonGeneralAromaticityModel | DaylightAromaticityModel | MayaChemToolsAromaticityModel\fR" 4 | |
| 179 .IX Item "--AromaticityModel MDLAromaticityModel | TriposAromaticityModel | MMFFAromaticityModel | ChemAxonBasicAromaticityModel | ChemAxonGeneralAromaticityModel | DaylightAromaticityModel | MayaChemToolsAromaticityModel" | |
| 180 Specify aromaticity model to use during detection of aromaticity. Possible values in the current | |
| 181 release are: \fIMDLAromaticityModel, TriposAromaticityModel, MMFFAromaticityModel, | |
| 182 ChemAxonBasicAromaticityModel, ChemAxonGeneralAromaticityModel, DaylightAromaticityModel | |
| 183 or MayaChemToolsAromaticityModel\fR. Default value: \fIMayaChemToolsAromaticityModel\fR. | |
| 184 .Sp | |
| 185 The supported aromaticity model names along with model specific control parameters | |
| 186 are defined in \fBAromaticityModelsData.csv\fR, which is distributed with the current release | |
| 187 and is available under \fBlib/data\fR directory. \fBMolecule.pm\fR module retrieves data from | |
| 188 this file during class instantiation and makes it available to method \fBDetectAromaticity\fR | |
| 189 for detecting aromaticity corresponding to a specific model. | |
| 190 .IP "\fB\-\-CompoundID\fR \fIDataFieldName or LabelPrefixString\fR" 4 | |
| 191 .IX Item "--CompoundID DataFieldName or LabelPrefixString" | |
| 192 This value is \fB\-\-CompoundIDMode\fR specific and indicates how compound \s-1ID\s0 is generated. | |
| 193 .Sp | |
| 194 For \fIDataField\fR value of \fB\-\-CompoundIDMode\fR option, it corresponds to datafield label name | |
| 195 whose value is used as compound \s-1ID\s0; otherwise, it's a prefix string used for generating compound | |
| 196 IDs like LabelPrefixString<Number>. Default value, \fICmpd\fR, generates compound IDs which | |
| 197 look like Cmpd<Number>. | |
| 198 .Sp | |
| 199 Examples for \fIDataField\fR value of \fB\-\-CompoundIDMode\fR: | |
| 200 .Sp | |
| 201 .Vb 2 | |
| 202 \& MolID | |
| 203 \& ExtReg | |
| 204 .Ve | |
| 205 .Sp | |
| 206 Examples for \fILabelPrefix\fR or \fIMolNameOrLabelPrefix\fR value of \fB\-\-CompoundIDMode\fR: | |
| 207 .Sp | |
| 208 .Vb 1 | |
| 209 \& Compound | |
| 210 .Ve | |
| 211 .Sp | |
| 212 The value specified above generates compound IDs which correspond to Compound<Number> | |
| 213 instead of default value of Cmpd<Number>. | |
| 214 .IP "\fB\-\-CompoundIDLabel\fR \fItext\fR" 4 | |
| 215 .IX Item "--CompoundIDLabel text" | |
| 216 Specify compound \s-1ID\s0 column label for \s-1CSV/TSV\s0 text file(s) used during \fICompoundID\fR value | |
| 217 of \fB\-\-DataFieldsMode\fR option. Default value: \fICompoundID\fR. | |
| 218 .IP "\fB\-\-CompoundIDMode\fR \fIDataField | MolName | LabelPrefix | MolNameOrLabelPrefix\fR" 4 | |
| 219 .IX Item "--CompoundIDMode DataField | MolName | LabelPrefix | MolNameOrLabelPrefix" | |
| 220 Specify how to generate compound IDs and write to \s-1CSV/TSV\s0 text file(s) along with calculated | |
| 221 physicochemical properties for \fItext | both\fR values of \fB\-\-output\fR option: use a \fISDFile(s)\fR | |
| 222 datafield value; use molname line from \fISDFile(s)\fR; generate a sequential \s-1ID\s0 with specific prefix; | |
| 223 use combination of both MolName and LabelPrefix with usage of LabelPrefix values for empty | |
| 224 molname lines. | |
| 225 .Sp | |
| 226 Possible values: \fIDataField | MolName | LabelPrefix | MolNameOrLabelPrefix\fR. | |
| 227 Default value: \fILabelPrefix\fR. | |
| 228 .Sp | |
| 229 For \fIMolNameAndLabelPrefix\fR value of \fB\-\-CompoundIDMode\fR, molname line in \fISDFile(s)\fR takes | |
| 230 precedence over sequential compound IDs generated using \fILabelPrefix\fR and only empty molname | |
| 231 values are replaced with sequential compound IDs. | |
| 232 .Sp | |
| 233 This is only used for \fICompoundID\fR value of \fB\-\-DataFieldsMode\fR option. | |
| 234 .ie n .IP "\fB\-\-DataFields\fR \fI""FieldLabel1,FieldLabel2,...""\fR" 4 | |
| 235 .el .IP "\fB\-\-DataFields\fR \fI``FieldLabel1,FieldLabel2,...''\fR" 4 | |
| 236 .IX Item "--DataFields FieldLabel1,FieldLabel2,..." | |
| 237 Comma delimited list of \fISDFiles(s)\fR data fields to extract and write to \s-1CSV/TSV\s0 text file(s) along | |
| 238 with calculated physicochemical properties for \fItext | both\fR values of \fB\-\-output\fR option. | |
| 239 .Sp | |
| 240 This is only used for \fISpecify\fR value of \fB\-\-DataFieldsMode\fR option. | |
| 241 .Sp | |
| 242 Examples: | |
| 243 .Sp | |
| 244 .Vb 2 | |
| 245 \& Extreg | |
| 246 \& MolID,CompoundName | |
| 247 .Ve | |
| 248 .IP "\fB\-d, \-\-DataFieldsMode\fR \fIAll | Common | Specify | CompoundID\fR" 4 | |
| 249 .IX Item "-d, --DataFieldsMode All | Common | Specify | CompoundID" | |
| 250 Specify how data fields in \fISDFile(s)\fR are transferred to output \s-1CSV/TSV\s0 text file(s) along | |
| 251 with calculated physicochemical properties for \fItext | both\fR values of \fB\-\-output\fR option: | |
| 252 transfer all \s-1SD\s0 data field; transfer \s-1SD\s0 data files common to all compounds; extract specified | |
| 253 data fields; generate a compound \s-1ID\s0 using molname line, a compound prefix, or a combination | |
| 254 of both. Possible values: \fIAll | Common | specify | CompoundID\fR. Default value: \fICompoundID\fR. | |
| 255 .IP "\fB\-f, \-\-Filter\fR \fIYes | No\fR" 4 | |
| 256 .IX Item "-f, --Filter Yes | No" | |
| 257 Specify whether to check and filter compound data in SDFile(s). Possible values: \fIYes or No\fR. | |
| 258 Default value: \fIYes\fR. | |
| 259 .Sp | |
| 260 By default, compound data is checked before calculating physiochemical properties and compounds | |
| 261 containing atom data corresponding to non-element symbols or no atom data are ignored. | |
| 262 .IP "\fB\-h, \-\-help\fR" 4 | |
| 263 .IX Item "-h, --help" | |
| 264 Print this help message. | |
| 265 .IP "\fB\-\-HydrogenBonds\fR \fIHBondsType1 | HBondsType2\fR" 4 | |
| 266 .IX Item "--HydrogenBonds HBondsType1 | HBondsType2" | |
| 267 Parameters to control calculation of hydrogen bond donors and acceptors. Possible values: | |
| 268 \&\fIHBondsType1, HydrogenBondsType1, HBondsType2, HydrogenBondsType2\fR. Default value: | |
| 269 \&\fIHBondsType2\fR which corresponds to \fBRuleOf5\fR definition for number of hydrogen bond | |
| 270 donors and acceptors. | |
| 271 .Sp | |
| 272 The current release of MayaChemTools supports identification of two types of hydrogen bond | |
| 273 donor and acceptor atoms with these names: | |
| 274 .Sp | |
| 275 .Vb 2 | |
| 276 \& HBondsType1 or HydrogenBondsType1 | |
| 277 \& HBondsType2 or HydrogenBondsType2 | |
| 278 .Ve | |
| 279 .Sp | |
| 280 The names of these hydrogen bond types are rather arbitrary. However, their definitions have | |
| 281 specific meaning and are as follows: | |
| 282 .Sp | |
| 283 .Vb 1 | |
| 284 \& HydrogenBondsType1 [ Ref 60\-61, Ref 65\-66 ]: | |
| 285 \& | |
| 286 \& Donor: NH, NH2, OH \- Any N and O with available H | |
| 287 \& Acceptor: N[!H], O \- Any N without available H and any O | |
| 288 \& | |
| 289 \& HydrogenBondsType2 [ Ref 91 ]: | |
| 290 \& | |
| 291 \& Donor: NH, NH2, OH \- N and O with available H | |
| 292 \& Acceptor: N, O \- And N and O | |
| 293 .Ve | |
| 294 .IP "\fB\-k, \-\-KeepLargestComponent\fR \fIYes | No\fR" 4 | |
| 295 .IX Item "-k, --KeepLargestComponent Yes | No" | |
| 296 Calculate physicochemical properties for only the largest component in molecule. Possible values: | |
| 297 \&\fIYes or No\fR. Default value: \fIYes\fR. | |
| 298 .Sp | |
| 299 For molecules containing multiple connected components, physicochemical properties can be | |
| 300 calculated in two different ways: use all connected components or just the largest connected | |
| 301 component. By default, all atoms except for the largest connected component are | |
| 302 deleted before calculation of physicochemical properties. | |
| 303 .ie n .IP "\fB\-m, \-\-mode\fR \fIAll | RuleOf5 | RuleOf3 | ""name1, [name2,...]""\fR" 4 | |
| 304 .el .IP "\fB\-m, \-\-mode\fR \fIAll | RuleOf5 | RuleOf3 | ``name1, [name2,...]''\fR" 4 | |
| 305 .IX Item "-m, --mode All | RuleOf5 | RuleOf3 | name1, [name2,...]" | |
| 306 Specify physicochemical properties to calculate for SDFile(s): calculate all available physical | |
| 307 chemical properties; calculate properties corresponding to Rule of 5; or use a comma delimited | |
| 308 list of supported physicochemical properties. Possible values: \fIAll | RuleOf5 | RuleOf3 | | |
| 309 \&\*(L"name1, [name2,...]\*(R"\fR. | |
| 310 .Sp | |
| 311 Default value: \fIMolecularWeight, HeavyAtoms, MolecularVolume, RotatableBonds, HydrogenBondDonors, | |
| 312 HydrogenBondAcceptors, SLogP, \s-1TPSA\s0\fR. These properties are calculated by default. | |
| 313 .Sp | |
| 314 \&\fIRuleOf5\fR [ Ref 91 ] includes these properties: \fIMolecularWeight, HydrogenBondDonors, HydrogenBondAcceptors, | |
| 315 SLogP\fR. \fIRuleOf5\fR states: MolecularWeight <= 500, HydrogenBondDonors <= 5, HydrogenBondAcceptors <= 10, and | |
| 316 logP <= 5. | |
| 317 .Sp | |
| 318 \&\fIRuleOf3\fR [ Ref 92 ] includes these properties: \fIMolecularWeight, RotatableBonds, HydrogenBondDonors, | |
| 319 HydrogenBondAcceptors, SLogP, \s-1TPSA\s0\fR. \fIRuleOf3\fR states: MolecularWeight <= 300, RotatableBonds <= 3, | |
| 320 HydrogenBondDonors <= 3, HydrogenBondAcceptors <= 3, logP <= 3, and \s-1TPSA\s0 <= 60. | |
| 321 .Sp | |
| 322 \&\fIAll\fR calculates all supported physicochemical properties: \fIMolecularWeight, ExactMass, | |
| 323 HeavyAtoms, Rings, AromaticRings, MolecularVolume, RotatableBonds, HydrogenBondDonors, | |
| 324 HydrogenBondAcceptors, SLogP, \s-1SMR\s0, \s-1TPSA\s0, Fsp3Carbons, Sp3Carbons, MolecularComplexity\fR. | |
| 325 .IP "\fB\-\-MolecularComplexity\fR \fIName,Value, [Name,Value,...]\fR" 4 | |
| 326 .IX Item "--MolecularComplexity Name,Value, [Name,Value,...]" | |
| 327 Parameters to control calculation of molecular complexity: it's a comma delimited list of parameter | |
| 328 name and value pairs. | |
| 329 .Sp | |
| 330 Possible parameter names: \fIMolecularComplexityType, AtomIdentifierType, | |
| 331 AtomicInvariantsToUse, FunctionalClassesToUse, MACCSKeysSize, NeighborhoodRadius, | |
| 332 MinPathLength, MaxPathLength, UseBondSymbols, MinDistance, MaxDistance, | |
| 333 UseTriangleInequality, DistanceBinSize, NormalizationMethodology\fR. | |
| 334 .Sp | |
| 335 The valid paramater valuse for each parameter name are described in the following sections. | |
| 336 .Sp | |
| 337 The current release of MayaChemTools supports calculation of molecular complexity using | |
| 338 \&\fIMolecularComplexityType\fR parameter corresponding to the number of bits-set or unique | |
| 339 keys [ Ref 117\-119 ] in molecular fingerprints. The valid values for \fIMolecularComplexityType\fR | |
| 340 are: | |
| 341 .Sp | |
| 342 .Vb 9 | |
| 343 \& AtomTypesFingerprints | |
| 344 \& ExtendedConnectivityFingerprints | |
| 345 \& MACCSKeys | |
| 346 \& PathLengthFingerprints | |
| 347 \& TopologicalAtomPairsFingerprints | |
| 348 \& TopologicalAtomTripletsFingerprints | |
| 349 \& TopologicalAtomTorsionsFingerprints | |
| 350 \& TopologicalPharmacophoreAtomPairsFingerprints | |
| 351 \& TopologicalPharmacophoreAtomTripletsFingerprints | |
| 352 .Ve | |
| 353 .Sp | |
| 354 Default value for \fIMolecularComplexityType\fR: \fIMACCSKeys\fR. | |
| 355 .Sp | |
| 356 \&\fIAtomIdentifierType\fR parameter name correspods to atom types used during generation of | |
| 357 fingerprints. The valid values for \fIAtomIdentifierType\fR are: \fIAtomicInvariantsAtomTypes, | |
| 358 DREIDINGAtomTypes, EStateAtomTypes, FunctionalClassAtomTypes, MMFF94AtomTypes, | |
| 359 SLogPAtomTypes, SYBYLAtomTypes, TPSAAtomTypes, UFFAtomTypes\fR. \fIAtomicInvariantsAtomTypes\fR | |
| 360 is not supported for during the following values of \fIMolecularComplexityType\fR: \fIMACCSKeys, | |
| 361 TopologicalPharmacophoreAtomPairsFingerprints, TopologicalPharmacophoreAtomTripletsFingerprints\fR. | |
| 362 \&\fIFunctionalClassAtomTypes\fR is the only valid value for \fIAtomIdentifierType\fR for topological | |
| 363 pharmacophore fingerprints. | |
| 364 .Sp | |
| 365 Default value for \fIAtomIdentifierType\fR: \fIAtomicInvariantsAtomTypes\fR | |
| 366 for all except topological pharmacophore fingerprints where it is \fIFunctionalClassAtomTypes\fR. | |
| 367 .Sp | |
| 368 \&\fIAtomicInvariantsToUse\fR parameter name and values are used during \fIAtomicInvariantsAtomTypes\fR | |
| 369 value of parameter \fIAtomIdentifierType\fR. It's a list of space separated valid atomic invariant atom types. | |
| 370 .Sp | |
| 371 Possible values for atomic invariants are: \fI\s-1AS\s0, X, \s-1BO\s0, \s-1LBO\s0, \s-1SB\s0, \s-1DB\s0, \s-1TB\s0, H, Ar, \s-1RA\s0, \s-1FC\s0, \s-1MN\s0, \s-1SM\s0\fR. | |
| 372 Default value for \fIAtomicInvariantsToUse\fR parameter are set differently for different fingerprints | |
| 373 using \fIMolecularComplexityType\fR parameter as shown below: | |
| 374 .Sp | |
| 375 .Vb 1 | |
| 376 \& MolecularComplexityType AtomicInvariantsToUse | |
| 377 \& | |
| 378 \& AtomTypesFingerprints AS X BO H FC | |
| 379 \& TopologicalAtomPairsFingerprints AS X BO H FC | |
| 380 \& TopologicalAtomTripletsFingerprints AS X BO H FC | |
| 381 \& TopologicalAtomTorsionsFingerprints AS X BO H FC | |
| 382 \& | |
| 383 \& ExtendedConnectivityFingerprints AS X BO H FC MN | |
| 384 \& PathLengthFingerprints AS | |
| 385 .Ve | |
| 386 .Sp | |
| 387 The atomic invariants abbreviations correspond to: | |
| 388 .Sp | |
| 389 .Vb 1 | |
| 390 \& AS = Atom symbol corresponding to element symbol | |
| 391 \& | |
| 392 \& X<n> = Number of non\-hydrogen atom neighbors or heavy atoms | |
| 393 \& BO<n> = Sum of bond orders to non\-hydrogen atom neighbors or heavy atoms | |
| 394 \& LBO<n> = Largest bond order of non\-hydrogen atom neighbors or heavy atoms | |
| 395 \& SB<n> = Number of single bonds to non\-hydrogen atom neighbors or heavy atoms | |
| 396 \& DB<n> = Number of double bonds to non\-hydrogen atom neighbors or heavy atoms | |
| 397 \& TB<n> = Number of triple bonds to non\-hydrogen atom neighbors or heavy atoms | |
| 398 \& H<n> = Number of implicit and explicit hydrogens for atom | |
| 399 \& Ar = Aromatic annotation indicating whether atom is aromatic | |
| 400 \& RA = Ring atom annotation indicating whether atom is a ring | |
| 401 \& FC<+n/\-n> = Formal charge assigned to atom | |
| 402 \& MN<n> = Mass number indicating isotope other than most abundant isotope | |
| 403 \& SM<n> = Spin multiplicity of atom. Possible values: 1 (singlet), 2 (doublet) or | |
| 404 \& 3 (triplet) | |
| 405 .Ve | |
| 406 .Sp | |
| 407 Atom type generated by AtomTypes::AtomicInvariantsAtomTypes class corresponds to: | |
| 408 .Sp | |
| 409 .Vb 1 | |
| 410 \& AS.X<n>.BO<n>.LBO<n>.<SB><n>.<DB><n>.<TB><n>.H<n>.Ar.RA.FC<+n/\-n>.MN<n>.SM<n> | |
| 411 .Ve | |
| 412 .Sp | |
| 413 Except for \s-1AS\s0 which is a required atomic invariant in atom types, all other atomic invariants are | |
| 414 optional. Atom type specification doesn't include atomic invariants with zero or undefined values. | |
| 415 .Sp | |
| 416 In addition to usage of abbreviations for specifying atomic invariants, the following descriptive words | |
| 417 are also allowed: | |
| 418 .Sp | |
| 419 .Vb 12 | |
| 420 \& X : NumOfNonHydrogenAtomNeighbors or NumOfHeavyAtomNeighbors | |
| 421 \& BO : SumOfBondOrdersToNonHydrogenAtoms or SumOfBondOrdersToHeavyAtoms | |
| 422 \& LBO : LargestBondOrderToNonHydrogenAtoms or LargestBondOrderToHeavyAtoms | |
| 423 \& SB : NumOfSingleBondsToNonHydrogenAtoms or NumOfSingleBondsToHeavyAtoms | |
| 424 \& DB : NumOfDoubleBondsToNonHydrogenAtoms or NumOfDoubleBondsToHeavyAtoms | |
| 425 \& TB : NumOfTripleBondsToNonHydrogenAtoms or NumOfTripleBondsToHeavyAtoms | |
| 426 \& H : NumOfImplicitAndExplicitHydrogens | |
| 427 \& Ar : Aromatic | |
| 428 \& RA : RingAtom | |
| 429 \& FC : FormalCharge | |
| 430 \& MN : MassNumber | |
| 431 \& SM : SpinMultiplicity | |
| 432 .Ve | |
| 433 .Sp | |
| 434 \&\fIAtomTypes::AtomicInvariantsAtomTypes\fR module is used to assign atomic invariant | |
| 435 atom types. | |
| 436 .Sp | |
| 437 \&\fIFunctionalClassesToUse\fR parameter name and values are used during \fIFunctionalClassAtomTypes\fR | |
| 438 value of parameter \fIAtomIdentifierType\fR. It's a list of space separated valid atomic invariant atom types. | |
| 439 .Sp | |
| 440 Possible values for atom functional classes are: \fIAr, \s-1CA\s0, H, \s-1HBA\s0, \s-1HBD\s0, Hal, \s-1NI\s0, \s-1PI\s0, \s-1RA\s0\fR. | |
| 441 .Sp | |
| 442 Default value for \fIFunctionalClassesToUse\fR parameter is set to: | |
| 443 .Sp | |
| 444 .Vb 1 | |
| 445 \& HBD HBA PI NI Ar Hal | |
| 446 .Ve | |
| 447 .Sp | |
| 448 for all fingerprints except for the following two \fIMolecularComplexityType\fR fingerints: | |
| 449 .Sp | |
| 450 .Vb 1 | |
| 451 \& MolecularComplexityType FunctionalClassesToUse | |
| 452 \& | |
| 453 \& TopologicalPharmacophoreAtomPairsFingerprints HBD HBA P, NI H | |
| 454 \& TopologicalPharmacophoreAtomTripletsFingerprints HBD HBA PI NI H Ar | |
| 455 .Ve | |
| 456 .Sp | |
| 457 The functional class abbreviations correspond to: | |
| 458 .Sp | |
| 459 .Vb 9 | |
| 460 \& HBD: HydrogenBondDonor | |
| 461 \& HBA: HydrogenBondAcceptor | |
| 462 \& PI : PositivelyIonizable | |
| 463 \& NI : NegativelyIonizable | |
| 464 \& Ar : Aromatic | |
| 465 \& Hal : Halogen | |
| 466 \& H : Hydrophobic | |
| 467 \& RA : RingAtom | |
| 468 \& CA : ChainAtom | |
| 469 \& | |
| 470 \& Functional class atom type specification for an atom corresponds to: | |
| 471 \& | |
| 472 \& Ar.CA.H.HBA.HBD.Hal.NI.PI.RA | |
| 473 .Ve | |
| 474 .Sp | |
| 475 \&\fIAtomTypes::FunctionalClassAtomTypes\fR module is used to assign functional class atom | |
| 476 types. It uses following definitions [ Ref 60\-61, Ref 65\-66 ]: | |
| 477 .Sp | |
| 478 .Vb 4 | |
| 479 \& HydrogenBondDonor: NH, NH2, OH | |
| 480 \& HydrogenBondAcceptor: N[!H], O | |
| 481 \& PositivelyIonizable: +, NH2 | |
| 482 \& NegativelyIonizable: \-, C(=O)OH, S(=O)OH, P(=O)OH | |
| 483 .Ve | |
| 484 .Sp | |
| 485 \&\fIMACCSKeysSize\fR parameter name is only used during \fIMACCSKeys\fR value of | |
| 486 \&\fIMolecularComplexityType\fR and corresponds to the size of \s-1MACCS\s0 key set. Possible | |
| 487 values: \fI166 or 322\fR. Default value: \fI166\fR. | |
| 488 .Sp | |
| 489 \&\fINeighborhoodRadius\fR parameter name is only used during \fIExtendedConnectivityFingerprints\fR | |
| 490 value of \fIMolecularComplexityType\fR and corresponds to atomic neighborhoods radius for | |
| 491 generating extended connectivity fingerprints. Possible values: positive integer. Default value: | |
| 492 \&\fI2\fR. | |
| 493 .Sp | |
| 494 \&\fIMinPathLength\fR and \fIMaxPathLength\fR parameters are only used during \fIPathLengthFingerprints\fR | |
| 495 value of \fIMolecularComplexityType\fR and correspond to minimum and maximum path lengths to use | |
| 496 for generating path length fingerprints. Possible values: positive integers. Default value: \fIMinPathLength \- 1\fR; | |
| 497 \&\fIMaxPathLength \- 8\fR. | |
| 498 .Sp | |
| 499 \&\fIUseBondSymbols\fR parameter is only used during \fIPathLengthFingerprints\fR value of | |
| 500 \&\fIMolecularComplexityType\fR and indicates whether bond symbols are included in atom path | |
| 501 strings used to generate path length fingerprints. Possible value: \fIYes or No\fR. Default value: | |
| 502 \&\fIYes\fR. | |
| 503 .Sp | |
| 504 \&\fIMinDistance\fR and \fIMaxDistance\fR parameters are only used during \fITopologicalAtomPairsFingerprints\fR | |
| 505 and \fITopologicalAtomTripletsFingerprints\fR values of \fIMolecularComplexityType\fR and correspond to | |
| 506 minimum and maximum bond distance between atom pairs during topological pharmacophore fingerprints. | |
| 507 Possible values: positive integers. Default value: \fIMinDistance \- 1\fR; \fIMaxDistance \- 10\fR. | |
| 508 .Sp | |
| 509 \&\fIUseTriangleInequality\fR parameter is used during these values for \fIMolecularComplexityType\fR: | |
| 510 \&\fITopologicalAtomTripletsFingerprints\fR and \fITopologicalPharmacophoreAtomTripletsFingerprints\fR. | |
| 511 Possible values: \fIYes or No\fR. It determines wheter to apply triangle inequality to distance triplets. | |
| 512 Default value: \fITopologicalAtomTripletsFingerprints \- No\fR; | |
| 513 \&\fITopologicalPharmacophoreAtomTripletsFingerprints \- Yes\fR. | |
| 514 .Sp | |
| 515 \&\fIDistanceBinSize\fR parameter is used during \fITopologicalPharmacophoreAtomTripletsFingerprints\fR | |
| 516 value of \fIMolecularComplexityType\fR and correspons to distance bin size used for binning | |
| 517 distances during generation of topological pharmacophore atom triplets fingerprints. Possible | |
| 518 value: positive integer. Default value: \fI2\fR. | |
| 519 .Sp | |
| 520 \&\fINormalizationMethodology\fR is only used for these values for \fIMolecularComplexityType\fR: | |
| 521 \&\fIExtendedConnectivityFingerprints\fR, \fITopologicalPharmacophoreAtomPairsFingerprints\fR | |
| 522 and \fITopologicalPharmacophoreAtomTripletsFingerprints\fR. It corresponds to normalization | |
| 523 methodology to use for scaling the number of bits-set or unique keys during generation of | |
| 524 fingerprints. Possible values during \fIExtendedConnectivityFingerprints\fR: \fINone or | |
| 525 ByHeavyAtomsCount\fR; Default value: \fINone\fR. Possible values during topological | |
| 526 pharmacophore atom pairs and tripletes fingerprints: \fINone or ByPossibleKeysCount\fR; | |
| 527 Default value: \fINone\fR. \fIByPossibleKeysCount\fR corresponds to total number of | |
| 528 possible topological pharmacophore atom pairs or triplets in a molecule. | |
| 529 .Sp | |
| 530 Examples of \fIMolecularComplexity\fR name and value parameters: | |
| 531 .Sp | |
| 532 .Vb 2 | |
| 533 \& MolecularComplexityType,AtomTypesFingerprints,AtomIdentifierType, | |
| 534 \& AtomicInvariantsAtomTypes,AtomicInvariantsToUse,AS X BO H FC | |
| 535 \& | |
| 536 \& MolecularComplexityType,ExtendedConnectivityFingerprints, | |
| 537 \& AtomIdentifierType,AtomicInvariantsAtomTypes, | |
| 538 \& AtomicInvariantsToUse,AS X BO H FC MN,NeighborhoodRadius,2, | |
| 539 \& NormalizationMethodology,None | |
| 540 \& | |
| 541 \& MolecularComplexityType,MACCSKeys,MACCSKeysSize,166 | |
| 542 \& | |
| 543 \& MolecularComplexityType,PathLengthFingerprints,AtomIdentifierType, | |
| 544 \& AtomicInvariantsAtomTypes,AtomicInvariantsToUse,AS,MinPathLength, | |
| 545 \& 1,MaxPathLength,8,UseBondSymbols,Yes | |
| 546 \& | |
| 547 \& MolecularComplexityType,TopologicalAtomPairsFingerprints, | |
| 548 \& AtomIdentifierType,AtomicInvariantsAtomTypes,AtomicInvariantsToUse, | |
| 549 \& AS X BO H FC,MinDistance,1,MaxDistance,10 | |
| 550 \& | |
| 551 \& MolecularComplexityType,TopologicalAtomTripletsFingerprints, | |
| 552 \& AtomIdentifierType,AtomicInvariantsAtomTypes,AtomicInvariantsToUse, | |
| 553 \& AS X BO H FC,MinDistance,1,MaxDistance,10,UseTriangleInequality,No | |
| 554 \& | |
| 555 \& MolecularComplexityType,TopologicalAtomTorsionsFingerprints, | |
| 556 \& AtomIdentifierType,AtomicInvariantsAtomTypes,AtomicInvariantsToUse, | |
| 557 \& AS X BO H FC | |
| 558 \& | |
| 559 \& MolecularComplexityType,TopologicalPharmacophoreAtomPairsFingerprints, | |
| 560 \& AtomIdentifierType,FunctionalClassAtomTypes,FunctionalClassesToUse, | |
| 561 \& HBD HBA PI NI H,MinDistance,1,MaxDistance,10,NormalizationMethodology, | |
| 562 \& None | |
| 563 \& | |
| 564 \& MolecularComplexityType,TopologicalPharmacophoreAtomTripletsFingerprints, | |
| 565 \& AtomIdentifierType,FunctionalClassAtomTypes,FunctionalClassesToUse, | |
| 566 \& HBD HBA PI NI H Ar,MinDistance,1,MaxDistance,10,NormalizationMethodology, | |
| 567 \& None,UseTriangleInequality,Yes,NormalizationMethodology,None, | |
| 568 \& DistanceBinSize,2 | |
| 569 .Ve | |
| 570 .IP "\fB\-\-OutDelim\fR \fIcomma | tab | semicolon\fR" 4 | |
| 571 .IX Item "--OutDelim comma | tab | semicolon" | |
| 572 Delimiter for output \s-1CSV/TSV\s0 text file(s). Possible values: \fIcomma, tab, or semicolon\fR | |
| 573 Default value: \fIcomma\fR. | |
| 574 .IP "\fB\-\-output\fR \fI\s-1SD\s0 | text | both\fR" 4 | |
| 575 .IX Item "--output SD | text | both" | |
| 576 Type of output files to generate. Possible values: \fI\s-1SD\s0, text, or both\fR. Default value: \fItext\fR. | |
| 577 .IP "\fB\-o, \-\-overwrite\fR" 4 | |
| 578 .IX Item "-o, --overwrite" | |
| 579 Overwrite existing files. | |
| 580 .IP "\fB\-\-Precision\fR \fIName,Number,[Name,Number,..]\fR" 4 | |
| 581 .IX Item "--Precision Name,Number,[Name,Number,..]" | |
| 582 Precision of calculated property values in the output file: it's a comma delimited list of | |
| 583 property name and precision value pairs. Possible property names: \fIMolecularWeight, | |
| 584 ExactMass\fR. Possible values: positive intergers. Default value: \fIMolecularWeight,2, | |
| 585 ExactMass,4\fR. | |
| 586 .Sp | |
| 587 Examples: | |
| 588 .Sp | |
| 589 .Vb 2 | |
| 590 \& ExactMass,3 | |
| 591 \& MolecularWeight,1,ExactMass,2 | |
| 592 .Ve | |
| 593 .IP "\fB\-q, \-\-quote\fR \fIYes | No\fR" 4 | |
| 594 .IX Item "-q, --quote Yes | No" | |
| 595 Put quote around column values in output \s-1CSV/TSV\s0 text file(s). Possible values: | |
| 596 \&\fIYes or No\fR. Default value: \fIYes\fR. | |
| 597 .IP "\fB\-r, \-\-root\fR \fIRootName\fR" 4 | |
| 598 .IX Item "-r, --root RootName" | |
| 599 New file name is generated using the root: <Root>.<Ext>. Default for new file names: | |
| 600 <SDFileName><PhysicochemicalProperties>.<Ext>. The file type determines <Ext> value. | |
| 601 The sdf, csv, and tsv <Ext> values are used for \s-1SD\s0, comma/semicolon, and tab | |
| 602 delimited text files, respectively.This option is ignored for multiple input files. | |
| 603 .IP "\fB\-\-RotatableBonds\fR \fIName,Value, [Name,Value,...]\fR" 4 | |
| 604 .IX Item "--RotatableBonds Name,Value, [Name,Value,...]" | |
| 605 Parameters to control calculation of rotatable bonds [ Ref 92 ]: it's a comma delimited list of parameter | |
| 606 name and value pairs. Possible parameter names: \fIIgnoreTerminalBonds, IgnoreBondsToTripleBonds, | |
| 607 IgnoreAmideBonds, IgnoreThioamideBonds, IgnoreSulfonamideBonds\fR. Possible parameter values: | |
| 608 \&\fIYes or No\fR. By default, value of all parameters is set to \fIYes\fR. | |
| 609 .IP "\fB\-\-RuleOf3Violations\fR \fIYes | No\fR" 4 | |
| 610 .IX Item "--RuleOf3Violations Yes | No" | |
| 611 Specify whether to calculate \fBRuleOf3Violations\fR for SDFile(s). Possible values: \fIYes or No\fR. | |
| 612 Default value: \fINo\fR. | |
| 613 .Sp | |
| 614 For \fIYes\fR value of \fBRuleOf3Violations\fR, in addition to calculating total number of \fBRuleOf3\fR violations, | |
| 615 individual violations for compounds are also written to output files. | |
| 616 .Sp | |
| 617 \&\fBRuleOf3\fR [ Ref 92 ] states: MolecularWeight <= 300, RotatableBonds <= 3, HydrogenBondDonors <= 3, | |
| 618 HydrogenBondAcceptors <= 3, logP <= 3, and \s-1TPSA\s0 <= 60. | |
| 619 .IP "\fB\-\-RuleOf5Violations\fR \fIYes | No\fR" 4 | |
| 620 .IX Item "--RuleOf5Violations Yes | No" | |
| 621 Specify whether to calculate \fBRuleOf5Violations\fR for SDFile(s). Possible values: \fIYes or No\fR. | |
| 622 Default value: \fINo\fR. | |
| 623 .Sp | |
| 624 For \fIYes\fR value of \fBRuleOf5Violations\fR, in addition to calculating total number of \fBRuleOf5\fR violations, | |
| 625 individual violations for compounds are also written to output files. | |
| 626 .Sp | |
| 627 \&\fBRuleOf5\fR [ Ref 91 ] states: MolecularWeight <= 500, HydrogenBondDonors <= 5, HydrogenBondAcceptors <= 10, | |
| 628 and logP <= 5. | |
| 629 .IP "\fB\-\-TPSA\fR \fIName,Value, [Name,Value,...]\fR" 4 | |
| 630 .IX Item "--TPSA Name,Value, [Name,Value,...]" | |
| 631 Parameters to control calculation of \s-1TPSA:\s0 it's a comma delimited list of parameter name and value | |
| 632 pairs. Possible parameter names: \fIIgnorePhosphorus, IgnoreSulfur\fR. Possible parameter values: | |
| 633 \&\fIYes or No\fR. By default, value of all parameters is set to \fIYes\fR. | |
| 634 .Sp | |
| 635 By default, \s-1TPSA\s0 atom contributions from Phosphorus and Sulfur atoms are not included during | |
| 636 \&\s-1TPSA\s0 calculations. [ Ref 91 ] | |
| 637 .IP "\fB\-w, \-\-WorkingDir\fR \fIDirName\fR" 4 | |
| 638 .IX Item "-w, --WorkingDir DirName" | |
| 639 Location of working directory. Default value: current directory. | |
| 640 .SH "EXAMPLES" | |
| 641 .IX Header "EXAMPLES" | |
| 642 To calculate default set of physicochemical properties \- MolecularWeight, HeavyAtoms, | |
| 643 MolecularVolume, RotatableBonds, HydrogenBondDonor, HydrogenBondAcceptors, SLogP, | |
| 644 \&\s-1TPSA\s0 \- and generate a SamplePhysicochemicalProperties.csv file containing sequential | |
| 645 compound IDs along with properties data, type: | |
| 646 .PP | |
| 647 .Vb 1 | |
| 648 \& % CalculatePhysicochemicalProperties.pl \-o Sample.sdf | |
| 649 .Ve | |
| 650 .PP | |
| 651 To calculate all available physicochemical properties and generate both SampleAllProperties.csv | |
| 652 and SampleAllProperties.sdf files containing sequential compound IDs in \s-1CSV\s0 file along with | |
| 653 properties data, type: | |
| 654 .PP | |
| 655 .Vb 2 | |
| 656 \& % CalculatePhysicochemicalProperties.pl \-m All \-\-output both | |
| 657 \& \-r SampleAllProperties \-o Sample.sdf | |
| 658 .Ve | |
| 659 .PP | |
| 660 To calculate RuleOf5 physicochemical properties and generate a SampleRuleOf5Properties.csv file | |
| 661 containing sequential compound IDs along with properties data, type: | |
| 662 .PP | |
| 663 .Vb 2 | |
| 664 \& % CalculatePhysicochemicalProperties.pl \-m RuleOf5 | |
| 665 \& \-r SampleRuleOf5Properties \-o Sample.sdf | |
| 666 .Ve | |
| 667 .PP | |
| 668 To calculate RuleOf5 physicochemical properties along with counting RuleOf5 violations and generate | |
| 669 a SampleRuleOf5Properties.csv file containing sequential compound IDs along with properties data, type: | |
| 670 .PP | |
| 671 .Vb 2 | |
| 672 \& % CalculatePhysicochemicalProperties.pl \-m RuleOf5 \-\-RuleOf5Violations Yes | |
| 673 \& \-r SampleRuleOf5Properties \-o Sample.sdf | |
| 674 .Ve | |
| 675 .PP | |
| 676 To calculate RuleOf3 physicochemical properties and generate a SampleRuleOf3Properties.csv file | |
| 677 containing sequential compound IDs along with properties data, type: | |
| 678 .PP | |
| 679 .Vb 2 | |
| 680 \& % CalculatePhysicochemicalProperties.pl \-m RuleOf3 | |
| 681 \& \-r SampleRuleOf3Properties \-o Sample.sdf | |
| 682 .Ve | |
| 683 .PP | |
| 684 To calculate RuleOf3 physicochemical properties along with counting RuleOf3 violations and generate | |
| 685 a SampleRuleOf3Properties.csv file containing sequential compound IDs along with properties data, type: | |
| 686 .PP | |
| 687 .Vb 2 | |
| 688 \& % CalculatePhysicochemicalProperties.pl \-m RuleOf3 \-\-RuleOf3Violations Yes | |
| 689 \& \-r SampleRuleOf3Properties \-o Sample.sdf | |
| 690 .Ve | |
| 691 .PP | |
| 692 To calculate a specific set of physicochemical properties and generate a SampleProperties.csv file | |
| 693 containing sequential compound IDs along with properties data, type: | |
| 694 .PP | |
| 695 .Vb 2 | |
| 696 \& % CalculatePhysicochemicalProperties.pl \-m "Rings,AromaticRings" | |
| 697 \& \-r SampleProperties \-o Sample.sdf | |
| 698 .Ve | |
| 699 .PP | |
| 700 To calculate HydrogenBondDonors and HydrogenBondAcceptors using HydrogenBondsType1 definition | |
| 701 and generate a SampleProperties.csv file containing sequential compound IDs along with properties | |
| 702 data, type: | |
| 703 .PP | |
| 704 .Vb 2 | |
| 705 \& % CalculatePhysicochemicalProperties.pl \-m "HydrogenBondDonors,HydrogenBondAcceptors" | |
| 706 \& \-\-HydrogenBonds HBondsType1 \-r SampleProperties \-o Sample.sdf | |
| 707 .Ve | |
| 708 .PP | |
| 709 To calculate \s-1TPSA\s0 using sulfur and phosphorus atoms along with nitrogen and oxygen atoms and | |
| 710 generate a SampleProperties.csv file containing sequential compound IDs along with properties | |
| 711 data, type: | |
| 712 .PP | |
| 713 .Vb 2 | |
| 714 \& % CalculatePhysicochemicalProperties.pl \-m "TPSA" \-\-TPSA "IgnorePhosphorus,No, | |
| 715 \& IgnoreSulfur,No" \-r SampleProperties \-o Sample.sdf | |
| 716 .Ve | |
| 717 .PP | |
| 718 To calculate MolecularComplexity using extendend connectivity fingerprints corresponding | |
| 719 to atom neighborhood radius of 2 with atomic invariant atom types without any scaling and | |
| 720 generate a SampleProperties.csv file containing sequential compound IDs along with properties | |
| 721 data, type: | |
| 722 .PP | |
| 723 .Vb 5 | |
| 724 \& % CalculatePhysicochemicalProperties.pl \-m MolecularComplexity \-\-MolecularComplexity | |
| 725 \& "MolecularComplexityType,ExtendedConnectivityFingerprints,NeighborhoodRadius,2, | |
| 726 \& AtomIdentifierType, AtomicInvariantsAtomTypes, | |
| 727 \& AtomicInvariantsToUse,AS X BO H FC MN,NormalizationMethodology,None" | |
| 728 \& \-r SampleProperties \-o Sample.sdf | |
| 729 .Ve | |
| 730 .PP | |
| 731 To calculate RuleOf5 physicochemical properties along with counting RuleOf5 violations and generate | |
| 732 a SampleRuleOf5Properties.csv file containing compound IDs from molecule name line along with | |
| 733 properties data, type: | |
| 734 .PP | |
| 735 .Vb 3 | |
| 736 \& % CalculatePhysicochemicalProperties.pl \-m RuleOf5 \-\-RuleOf5Violations Yes | |
| 737 \& \-\-DataFieldsMode CompoundID \-\-CompoundIDMode MolName | |
| 738 \& \-r SampleRuleOf5Properties \-o Sample.sdf | |
| 739 .Ve | |
| 740 .PP | |
| 741 To calculate all available physicochemical properties and generate a SampleAllProperties.csv | |
| 742 file containing compound \s-1ID\s0 using specified data field along with along with properties data, | |
| 743 type: | |
| 744 .PP | |
| 745 .Vb 3 | |
| 746 \& % CalculatePhysicochemicalProperties.pl \-m All | |
| 747 \& \-\-DataFieldsMode CompoundID \-\-CompoundIDMode DataField \-\-CompoundID Mol_ID | |
| 748 \& \-r SampleAllProperties \-o Sample.sdf | |
| 749 .Ve | |
| 750 .PP | |
| 751 To calculate all available physicochemical properties and generate a SampleAllProperties.csv | |
| 752 file containing compound \s-1ID\s0 using combination of molecule name line and an explicit compound | |
| 753 prefix along with properties data, type: | |
| 754 .PP | |
| 755 .Vb 4 | |
| 756 \& % CalculatePhysicochemicalProperties.pl \-m All | |
| 757 \& \-\-DataFieldsMode CompoundID \-\-CompoundIDMode MolnameOrLabelPrefix | |
| 758 \& \-\-CompoundID Cmpd \-\-CompoundIDLabel MolID \-r SampleAllProperties | |
| 759 \& \-o Sample.sdf | |
| 760 .Ve | |
| 761 .PP | |
| 762 To calculate all available physicochemical properties and generate a SampleAllProperties.csv | |
| 763 file containing specific data fields columns along with with properties data, type: | |
| 764 .PP | |
| 765 .Vb 3 | |
| 766 \& % CalculatePhysicochemicalProperties.pl \-m All | |
| 767 \& \-\-DataFieldsMode Specify \-\-DataFields Mol_ID \-r SampleAllProperties | |
| 768 \& \-o Sample.sdf | |
| 769 .Ve | |
| 770 .PP | |
| 771 To calculate all available physicochemical properties and generate a SampleAllProperties.csv | |
| 772 file containing common data fields columns along with with properties data, type: | |
| 773 .PP | |
| 774 .Vb 2 | |
| 775 \& % CalculatePhysicochemicalProperties.pl \-m All | |
| 776 \& \-\-DataFieldsMode Common \-r SampleAllProperties \-o Sample.sdf | |
| 777 .Ve | |
| 778 .PP | |
| 779 To calculate all available physicochemical properties and generate both SampleAllProperties.csv | |
| 780 and \s-1CSV\s0 files containing all data fields columns in \s-1CSV\s0 files along with with properties data, type: | |
| 781 .PP | |
| 782 .Vb 3 | |
| 783 \& % CalculatePhysicochemicalProperties.pl \-m All | |
| 784 \& \-\-DataFieldsMode All \-\-output both \-r SampleAllProperties | |
| 785 \& \-o Sample.sdf | |
| 786 .Ve | |
| 787 .SH "AUTHOR" | |
| 788 .IX Header "AUTHOR" | |
| 789 Manish Sud <msud@san.rr.com> | |
| 790 .SH "SEE ALSO" | |
| 791 .IX Header "SEE ALSO" | |
| 792 ExtractFromSDtFiles.pl, ExtractFromTextFiles.pl, InfoSDFiles.pl, InfoTextFiles.pl | |
| 793 .SH "COPYRIGHT" | |
| 794 .IX Header "COPYRIGHT" | |
| 795 Copyright (C) 2015 Manish Sud. All rights reserved. | |
| 796 .PP | |
| 797 This file is part of MayaChemTools. | |
| 798 .PP | |
| 799 MayaChemTools is free software; you can redistribute it and/or modify it under | |
| 800 the terms of the \s-1GNU\s0 Lesser General Public License as published by the Free | |
| 801 Software Foundation; either version 3 of the License, or (at your option) | |
| 802 any later version. |
