| 
0
 | 
     1 <html>
 | 
| 
 | 
     2 <head>
 | 
| 
 | 
     3 <title>MayaChemTools:Code:SimilaritySearchingFingerprints.pl</title>
 | 
| 
 | 
     4 <meta http-equiv="content-type" content="text/html;charset=utf-8">
 | 
| 
 | 
     5 <link rel="stylesheet" type="text/css" href="../../../css/MayaChemToolsCode.css">
 | 
| 
 | 
     6 </head>
 | 
| 
 | 
     7 <body leftmargin="20" rightmargin="20" topmargin="10" bottommargin="10">
 | 
| 
 | 
     8 <br/>
 | 
| 
 | 
     9 <center>
 | 
| 
 | 
    10 <a href="http://www.mayachemtools.org" title="MayaChemTools Home"><img src="../../../images/MayaChemToolsLogo.gif" border="0" alt="MayaChemTools"></a>
 | 
| 
 | 
    11 </center>
 | 
| 
 | 
    12 <br/>
 | 
| 
 | 
    13 <pre>
 | 
| 
 | 
    14    1 #!/usr/bin/perl -w
 | 
| 
 | 
    15    2 <span class="c">#</span>
 | 
| 
 | 
    16    3 <span class="c"># $RCSfile: SimilaritySearchingFingerprints.pl,v $</span>
 | 
| 
 | 
    17    4 <span class="c"># $Date: 2015/02/28 20:46:21 $</span>
 | 
| 
 | 
    18    5 <span class="c"># $Revision: 1.18 $</span>
 | 
| 
 | 
    19    6 <span class="c">#</span>
 | 
| 
 | 
    20    7 <span class="c"># Author: Manish Sud &lt;msud@san.rr.com&gt;</span>
 | 
| 
 | 
    21    8 <span class="c">#</span>
 | 
| 
 | 
    22    9 <span class="c"># Copyright (C) 2015 Manish Sud. All rights reserved.</span>
 | 
| 
 | 
    23   10 <span class="c">#</span>
 | 
| 
 | 
    24   11 <span class="c"># This file is part of MayaChemTools.</span>
 | 
| 
 | 
    25   12 <span class="c">#</span>
 | 
| 
 | 
    26   13 <span class="c"># MayaChemTools is free software; you can redistribute it and/or modify it under</span>
 | 
| 
 | 
    27   14 <span class="c"># the terms of the GNU Lesser General Public License as published by the Free</span>
 | 
| 
 | 
    28   15 <span class="c"># Software Foundation; either version 3 of the License, or (at your option) any</span>
 | 
| 
 | 
    29   16 <span class="c"># later version.</span>
 | 
| 
 | 
    30   17 <span class="c">#</span>
 | 
| 
 | 
    31   18 <span class="c"># MayaChemTools is distributed in the hope that it will be useful, but without</span>
 | 
| 
 | 
    32   19 <span class="c"># any warranty; without even the implied warranty of merchantability or fitness</span>
 | 
| 
 | 
    33   20 <span class="c"># for a particular purpose.  See the GNU Lesser General Public License for more</span>
 | 
| 
 | 
    34   21 <span class="c"># details.</span>
 | 
| 
 | 
    35   22 <span class="c">#</span>
 | 
| 
 | 
    36   23 <span class="c"># You should have received a copy of the GNU Lesser General Public License</span>
 | 
| 
 | 
    37   24 <span class="c"># along with MayaChemTools; if not, see &lt;http://www.gnu.org/licenses/&gt; or</span>
 | 
| 
 | 
    38   25 <span class="c"># write to the Free Software Foundation Inc., 59 Temple Place, Suite 330,</span>
 | 
| 
 | 
    39   26 <span class="c"># Boston, MA, 02111-1307, USA.</span>
 | 
| 
 | 
    40   27 <span class="c">#</span>
 | 
| 
 | 
    41   28 
 | 
| 
 | 
    42   29 <span class="k">use</span> <span class="w">strict</span><span class="sc">;</span>
 | 
| 
 | 
    43   30 <span class="k">use</span> <span class="w">FindBin</span><span class="sc">;</span> <span class="k">use</span> <span class="w">lib</span> <span class="q">"$FindBin::Bin/../lib"</span><span class="sc">;</span>
 | 
| 
 | 
    44   31 <span class="k">use</span> <span class="w">Getopt::Long</span><span class="sc">;</span>
 | 
| 
 | 
    45   32 <span class="k">use</span> <span class="w">File::Basename</span><span class="sc">;</span>
 | 
| 
 | 
    46   33 <span class="k">use</span> <span class="w">Text::ParseWords</span><span class="sc">;</span>
 | 
| 
 | 
    47   34 <span class="k">use</span> <span class="w">Benchmark</span><span class="sc">;</span>
 | 
| 
 | 
    48   35 <span class="k">use</span> <span class="w">FileUtil</span><span class="sc">;</span>
 | 
| 
 | 
    49   36 <span class="k">use</span> <span class="w">TextUtil</span><span class="sc">;</span>
 | 
| 
 | 
    50   37 <span class="k">use</span> <span class="w">SDFileUtil</span><span class="sc">;</span>
 | 
| 
 | 
    51   38 <span class="k">use</span> <span class="w">StatisticsUtil</span><span class="sc">;</span>
 | 
| 
 | 
    52   39 <span class="k">use</span> <span class="w">PseudoHeap</span><span class="sc">;</span>
 | 
| 
 | 
    53   40 <span class="k">use</span> <span class="w">Fingerprints::FingerprintsFileUtil</span><span class="sc">;</span>
 | 
| 
 | 
    54   41 <span class="k">use</span> <span class="w">Fingerprints::FingerprintsBitVector</span><span class="sc">;</span>
 | 
| 
 | 
    55   42 <span class="k">use</span> <span class="w">Fingerprints::FingerprintsVector</span><span class="sc">;</span>
 | 
| 
 | 
    56   43 
 | 
| 
 | 
    57   44 <span class="k">my</span><span class="s">(</span><span class="i">$ScriptName</span><span class="cm">,</span> <span class="i">%Options</span><span class="cm">,</span> <span class="i">$StartTime</span><span class="cm">,</span> <span class="i">$EndTime</span><span class="cm">,</span> <span class="i">$TotalTime</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    58   45 
 | 
| 
 | 
    59   46 <span class="c"># Autoflush STDOUT</span>
 | 
| 
 | 
    60   47 <span class="i">$|</span> = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
    61   48 
 | 
| 
 | 
    62   49 <span class="c"># Starting message...</span>
 | 
| 
 | 
    63   50 <span class="i">$ScriptName</span> = <span class="i">basename</span><span class="s">(</span><span class="i">$0</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    64   51 <span class="k">print</span> <span class="q">"\n$ScriptName: Starting...\n\n"</span><span class="sc">;</span>
 | 
| 
 | 
    65   52 <span class="i">$StartTime</span> = <span class="w">new</span> <span class="w">Benchmark</span><span class="sc">;</span>
 | 
| 
 | 
    66   53 
 | 
| 
 | 
    67   54 <span class="c"># Get the options and setup script...</span>
 | 
| 
 | 
    68   55 <span class="i">SetupScriptUsage</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    69   56 <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">help</span>} || <span class="i">@ARGV</span> != <span class="n">2</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
    70   57   <span class="k">die</span> <span class="i">GetUsageFromPod</span><span class="s">(</span><span class="q">"$FindBin::Bin/$ScriptName"</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    71   58 <span class="s">}</span>
 | 
| 
 | 
    72   59 
 | 
| 
 | 
    73   60 <span class="c"># Process reference and database file names...</span>
 | 
| 
 | 
    74   61 <span class="k">my</span><span class="s">(</span><span class="i">@FingerprintsFilesList</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    75   62 <span class="i">ProcessFingerprintsFileNames</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    76   63 
 | 
| 
 | 
    77   64 <span class="c"># Process options...</span>
 | 
| 
 | 
    78   65 <span class="k">print</span> <span class="q">"Processing options...\n"</span><span class="sc">;</span>
 | 
| 
 | 
    79   66 <span class="k">my</span><span class="s">(</span><span class="i">%OptionsInfo</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    80   67 <span class="i">ProcessOptions</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    81   68 
 | 
| 
 | 
    82   69 <span class="c"># Setup information about fingerprints input and SD/text output files...</span>
 | 
| 
 | 
    83   70 <span class="k">my</span><span class="s">(</span><span class="i">%FingerprintsFilesInfo</span><span class="cm">,</span> <span class="i">%OutputFilesInfo</span><span class="cm">,</span> <span class="i">%SimilaritySearchInfo</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    84   71 <span class="k">print</span> <span class="q">"Checking and retrieving information from reference and database fingerprints files...\n"</span><span class="sc">;</span>
 | 
| 
 | 
    85   72 <span class="i">RetrieveFingerprintsFilesInfo</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    86   73 
 | 
| 
 | 
    87   74 <span class="c"># Perform similarity search...</span>
 | 
| 
 | 
    88   75 <span class="k">print</span> <span class="q">"Performing similarity search...\n"</span><span class="sc">;</span>
 | 
| 
 | 
    89   76 <span class="k">my</span><span class="s">(</span><span class="i">%SimilaritySearchResults</span><span class="cm">,</span> <span class="i">%DatabaseFingerprintsFileData</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    90   77 <span class="i">PerformSimilaritySearch</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    91   78 
 | 
| 
 | 
    92   79 <span class="k">print</span> <span class="q">"\n$ScriptName:Done...\n\n"</span><span class="sc">;</span>
 | 
| 
 | 
    93   80 
 | 
| 
 | 
    94   81 <span class="i">$EndTime</span> = <span class="w">new</span> <span class="w">Benchmark</span><span class="sc">;</span>
 | 
| 
 | 
    95   82 <span class="i">$TotalTime</span> = <span class="w">timediff</span> <span class="s">(</span><span class="i">$EndTime</span><span class="cm">,</span> <span class="i">$StartTime</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
    96   83 <span class="k">print</span> <span class="q">"Total time: "</span><span class="cm">,</span> <span class="i">timestr</span><span class="s">(</span><span class="i">$TotalTime</span><span class="s">)</span><span class="cm">,</span> <span class="q">"\n"</span><span class="sc">;</span>
 | 
| 
 | 
    97   84 
 | 
| 
 | 
    98   85 <span class="c">###############################################################################</span>
 | 
| 
 | 
    99   86 
 | 
| 
 | 
   100   87 <span class="c"># Perform similarity search using fingerprints data in reference and database text files...</span>
 | 
| 
 | 
   101   88 <span class="c">#</span>
 | 
| 
 | 
   102 <a name="PerformSimilaritySearch-"></a>  89 <span class="k">sub </span><span class="m">PerformSimilaritySearch</span> <span class="s">{</span>
 | 
| 
 | 
   103   90 
 | 
| 
 | 
   104   91   <span class="k">print</span> <span class="q">"\nProcessing fingerprints data for reference molecules...\n"</span><span class="sc">;</span>
 | 
| 
 | 
   105   92   <span class="i">ReadReferenceFingerprintsData</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   106   93 
 | 
| 
 | 
   107   94   <span class="i">InitializeSimilaritySearchResults</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   108   95   <span class="i">GenerateSimilaritySearchResults</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   109   96   <span class="i">WriteSimilaritySearchResultFiles</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   110   97 <span class="s">}</span>
 | 
| 
 | 
   111   98 
 | 
| 
 | 
   112   99 <span class="c"># Find similar molecules from database molecules for individual or multiple reference molecules...</span>
 | 
| 
 | 
   113  100 <span class="c">#</span>
 | 
| 
 | 
   114 <a name="GenerateSimilaritySearchResults-"></a> 101 <span class="k">sub </span><span class="m">GenerateSimilaritySearchResults</span> <span class="s">{</span>
 | 
| 
 | 
   115  102   <span class="k">my</span><span class="s">(</span><span class="i">$DatabaseFingerprintsFileIO</span><span class="cm">,</span> <span class="i">$FingerprintsCount</span><span class="cm">,</span> <span class="i">$IgnoredFingerprintsCount</span><span class="cm">,</span> <span class="i">$DatabaseFingerprintsObject</span><span class="cm">,</span> <span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$ReferenceFingerprintsObject</span><span class="cm">,</span> <span class="i">$ReferenceIndex</span><span class="cm">,</span> <span class="i">$ReferenceCmpdID</span><span class="cm">,</span> <span class="i">$ComparisonValue</span><span class="cm">,</span> <span class="i">$FusedComparisonValue</span><span class="cm">,</span> <span class="i">@ComparisonValues</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   116  103 
 | 
| 
 | 
   117  104   <span class="k">print</span> <span class="q">"Processing fingerprints data for database molecules...\n"</span><span class="sc">;</span>
 | 
| 
 | 
   118  105 
 | 
| 
 | 
   119  106   <span class="s">(</span><span class="i">$FingerprintsCount</span><span class="cm">,</span> <span class="i">$IgnoredFingerprintsCount</span><span class="s">)</span> = <span class="s">(</span><span class="n">0</span><span class="s">)</span> x <span class="n">3</span><span class="sc">;</span>
 | 
| 
 | 
   120  107 
 | 
| 
 | 
   121  108   <span class="i">$DatabaseFingerprintsFileIO</span> = <span class="i">Fingerprints::FingerprintsFileUtil::NewFingerprintsFileIO</span><span class="s">(</span><span class="i">%</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FingerprintsFileIOParameters</span>}}<span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   122  109   <span class="i">$DatabaseFingerprintsFileIO</span><span class="i">->Open</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   123  110 
 | 
| 
 | 
   124  111   <span class="i">@ComparisonValues</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   125  112 
 | 
| 
 | 
   126  113   <span class="j">DATABASEFP:</span> <span class="k">while</span> <span class="s">(</span><span class="i">$DatabaseFingerprintsFileIO</span><span class="i">->Read</span><span class="s">(</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   127  114     <span class="i">$FingerprintsCount</span>++<span class="sc">;</span>
 | 
| 
 | 
   128  115 
 | 
| 
 | 
   129  116     <span class="k">if</span> <span class="s">(</span>!<span class="i">$DatabaseFingerprintsFileIO</span><span class="i">->IsFingerprintsDataValid</span><span class="s">(</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   130  117       <span class="i">$IgnoredFingerprintsCount</span>++<span class="sc">;</span>
 | 
| 
 | 
   131  118       <span class="k">next</span> <span class="j">DATABASEFP</span><span class="sc">;</span>
 | 
| 
 | 
   132  119     <span class="s">}</span>
 | 
| 
 | 
   133  120     <span class="i">$DatabaseFingerprintsObject</span> = <span class="i">$DatabaseFingerprintsFileIO</span><span class="i">->GetFingerprints</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   134  121     <span class="i">$DatabaseCmpdID</span> = <span class="i">$DatabaseFingerprintsFileIO</span><span class="i">->GetCompoundID</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   135  122 
 | 
| 
 | 
   136  123     <span class="k">if</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">MultipleReferencesMode</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   137  124       <span class="i">@ComparisonValues</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   138  125     <span class="s">}</span>
 | 
| 
 | 
   139  126 
 | 
| 
 | 
   140  127     <span class="j">REFERENCEFP:</span> <span class="k">for</span> <span class="i">$ReferenceIndex</span> <span class="s">(</span><span class="n">0</span> .. <span class="i">$#</span>{<span class="i">$SimilaritySearchInfo</span>{<span class="w">ReferenceCmpdIDsRef</span>}}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   141  128       <span class="i">$ReferenceCmpdID</span> = <span class="i">$SimilaritySearchInfo</span>{<span class="w">ReferenceCmpdIDsRef</span>}->[<span class="i">$ReferenceIndex</span>]<span class="sc">;</span>
 | 
| 
 | 
   142  129       <span class="i">$ReferenceFingerprintsObject</span> = <span class="i">$SimilaritySearchInfo</span>{<span class="w">ReferenceFingerprintsObjectsRef</span>}->[<span class="i">$ReferenceIndex</span>]<span class="sc">;</span>
 | 
| 
 | 
   143  130 
 | 
| 
 | 
   144  131       <span class="i">$ComparisonValue</span> = <span class="i">CompareReferenceAndDatabaseFingerprintsPair</span><span class="s">(</span><span class="i">$ReferenceFingerprintsObject</span><span class="cm">,</span> <span class="i">$DatabaseFingerprintsObject</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   145  132       <span class="k">if</span> <span class="s">(</span>!<span class="k">defined</span> <span class="i">$ComparisonValue</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   146  133         <span class="k">next</span> <span class="j">REFERENCEFP</span><span class="sc">;</span>
 | 
| 
 | 
   147  134       <span class="s">}</span>
 | 
| 
 | 
   148  135 
 | 
| 
 | 
   149  136       <span class="k">if</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">IndividualReferenceMode</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   150  137         <span class="i">CollectSimilaritySearchResults</span><span class="s">(</span><span class="i">$DatabaseFingerprintsFileIO</span><span class="cm">,</span> <span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$ComparisonValue</span><span class="cm">,</span> <span class="i">$ReferenceCmpdID</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   151  138       <span class="s">}</span>
 | 
| 
 | 
   152  139       <span class="k">elsif</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">MultipleReferencesMode</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   153  140         <span class="k">push</span> <span class="i">@ComparisonValues</span><span class="cm">,</span> <span class="i">$ComparisonValue</span><span class="sc">;</span>
 | 
| 
 | 
   154  141       <span class="s">}</span>
 | 
| 
 | 
   155  142     <span class="s">}</span>
 | 
| 
 | 
   156  143 
 | 
| 
 | 
   157  144     <span class="k">if</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">MultipleReferencesMode</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   158  145       <span class="i">$FusedComparisonValue</span> = <span class="i">CalculateGroupFusionComparisonValue</span><span class="s">(</span>\<span class="i">@ComparisonValues</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   159  146       <span class="k">if</span> <span class="s">(</span>!<span class="k">defined</span> <span class="i">$FusedComparisonValue</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   160  147         <span class="k">next</span> <span class="j">DATABASEFP</span><span class="sc">;</span>
 | 
| 
 | 
   161  148       <span class="s">}</span>
 | 
| 
 | 
   162  149       <span class="i">CollectSimilaritySearchResults</span><span class="s">(</span><span class="i">$DatabaseFingerprintsFileIO</span><span class="cm">,</span> <span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$FusedComparisonValue</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   163  150     <span class="s">}</span>
 | 
| 
 | 
   164  151   <span class="s">}</span>
 | 
| 
 | 
   165  152   <span class="i">$DatabaseFingerprintsFileIO</span><span class="i">->Close</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   166  153 
 | 
| 
 | 
   167  154   <span class="k">print</span> <span class="q">"Number of fingerprints data entries in database fingerprints file: $FingerprintsCount\n"</span><span class="sc">;</span>
 | 
| 
 | 
   168  155   <span class="k">print</span> <span class="q">"Number of fingerprints date entries processed successfully: "</span><span class="cm">,</span> <span class="s">(</span><span class="i">$FingerprintsCount</span> - <span class="i">$IgnoredFingerprintsCount</span><span class="s">)</span>  <span class="cm">,</span> <span class="q">"\n"</span><span class="sc">;</span>
 | 
| 
 | 
   169  156   <span class="k">print</span> <span class="q">"Number of fingerprints data entries ignored due to missing/invalid data: $IgnoredFingerprintsCount\n\n"</span><span class="sc">;</span>
 | 
| 
 | 
   170  157 <span class="s">}</span>
 | 
| 
 | 
   171  158 
 | 
| 
 | 
   172  159 <span class="c"># Compare a pair of reference and database fingerprints objects corresponding to bit-vector or</span>
 | 
| 
 | 
   173  160 <span class="c"># vectors using specified comparison method and comparison cutoff...</span>
 | 
| 
 | 
   174  161 <span class="c">#</span>
 | 
| 
 | 
   175 <a name="CompareReferenceAndDatabaseFingerprintsPair-"></a> 162 <span class="k">sub </span><span class="m">CompareReferenceAndDatabaseFingerprintsPair</span> <span class="s">{</span>
 | 
| 
 | 
   176  163   <span class="k">my</span><span class="s">(</span><span class="i">$ReferenceFingerprintsObject</span><span class="cm">,</span> <span class="i">$DatabaseFingerprintsObject</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   177  164   <span class="k">my</span><span class="s">(</span><span class="i">$ComparisonMethod</span><span class="cm">,</span> <span class="i">$ComparisonValue</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   178  165 
 | 
| 
 | 
   179  166   <span class="i">$ComparisonMethod</span> = <span class="i">$SimilaritySearchInfo</span>{<span class="w">ComparisonMethod</span>}<span class="sc">;</span>
 | 
| 
 | 
   180  167   <span class="i">$ComparisonValue</span> = <span class="i">$ReferenceFingerprintsObject</span><span class="i">->$ComparisonMethod</span><span class="s">(</span><span class="i">$DatabaseFingerprintsObject</span><span class="cm">,</span> <span class="i">@</span>{<span class="i">$SimilaritySearchInfo</span>{<span class="w">ComparisonMethodParameters</span>}}<span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   181  168 
 | 
| 
 | 
   182  169   <span class="k">if</span> <span class="s">(</span>!<span class="k">defined</span> <span class="i">$ComparisonValue</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   183  170     <span class="k">warn</span> <span class="q">"Warning: Ignoring fingerprints data for reference compound ID "</span><span class="cm">,</span>  <span class="i">$ReferenceFingerprintsObject</span><span class="i">->GetID</span><span class="s">(</span><span class="s">)</span><span class="cm">,</span> <span class="q">": Its comparison with database compound ID, "</span><span class="cm">,</span> <span class="i">$DatabaseFingerprintsObject</span><span class="i">->GetID</span><span class="s">(</span><span class="s">)</span><span class="cm">,</span> <span class="q">", failed.\n"</span><span class="sc">;</span>
 | 
| 
 | 
   184  171     <span class="k">return</span> <span class="k">undef</span><span class="sc">;</span>
 | 
| 
 | 
   185  172   <span class="s">}</span>
 | 
| 
 | 
   186  173 
 | 
| 
 | 
   187  174   <span class="i">$ComparisonValue</span> = <span class="k">sprintf</span><span class="s">(</span><span class="q">"%.$OptionsInfo{Precision}f"</span><span class="cm">,</span> <span class="i">$ComparisonValue</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   188  175 
 | 
| 
 | 
   189  176   <span class="c"># Apply any comparison cutoff...</span>
 | 
| 
 | 
   190  177   <span class="k">if</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">ApplyComparisonCutoff</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   191  178     <span class="k">return</span> <span class="i">$SimilaritySearchInfo</span>{<span class="w">KeepTop</span>} ? <span class="s">(</span><span class="i">$ComparisonValue</span> &gt;= <span class="i">$SimilaritySearchInfo</span>{<span class="w">ComparisonCutoff</span>} ? <span class="i">$ComparisonValue</span> <span class="co">:</span> <span class="k">undef</span><span class="s">)</span> <span class="co">:</span> <span class="s">(</span><span class="i">$ComparisonValue</span> &lt;= <span class="i">$SimilaritySearchInfo</span>{<span class="w">ComparisonCutoff</span>} ? <span class="i">$ComparisonValue</span> <span class="co">:</span> <span class="k">undef</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   192  179   <span class="s">}</span>
 | 
| 
 | 
   193  180   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
   194  181     <span class="k">return</span> <span class="i">$ComparisonValue</span><span class="sc">;</span>
 | 
| 
 | 
   195  182   <span class="s">}</span>
 | 
| 
 | 
   196  183 <span class="s">}</span>
 | 
| 
 | 
   197  184 
 | 
| 
 | 
   198  185 <span class="c"># Calculate group fusion comparison value...</span>
 | 
| 
 | 
   199  186 <span class="c">#</span>
 | 
| 
 | 
   200 <a name="CalculateGroupFusionComparisonValue-"></a> 187 <span class="k">sub </span><span class="m">CalculateGroupFusionComparisonValue</span> <span class="s">{</span>
 | 
| 
 | 
   201  188   <span class="k">my</span><span class="s">(</span><span class="i">$ComparisonValuesRef</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   202  189   <span class="k">my</span><span class="s">(</span><span class="i">$FusedComparisonValue</span><span class="cm">,</span> <span class="i">@ComparisonValues</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   203  190 
 | 
| 
 | 
   204  191   <span class="k">if</span> <span class="s">(</span>!<span class="i">@</span>{<span class="i">$ComparisonValuesRef</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   205  192     <span class="k">return</span> <span class="k">undef</span><span class="sc">;</span>
 | 
| 
 | 
   206  193   <span class="s">}</span>
 | 
| 
 | 
   207  194 
 | 
| 
 | 
   208  195   <span class="k">if</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">SortComparisonValues</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   209  196     <span class="i">@ComparisonValues</span> = <span class="k">sort</span> <span class="s">{</span> <span class="i">$SimilaritySearchInfo</span>{<span class="w">KeepTop</span>} ? <span class="s">(</span><span class="i">$b</span> &lt;=&gt; <span class="i">$a</span><span class="s">)</span> <span class="co">:</span> <span class="s">(</span><span class="i">$a</span> &lt;=&gt; <span class="i">$b</span><span class="s">)</span> <span class="s">}</span> <span class="i">@</span>{<span class="i">$ComparisonValuesRef</span>}<span class="sc">;</span>
 | 
| 
 | 
   210  197     <span class="k">if</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">UsekNN</span>} &amp;&amp; <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">kNN</span>} &lt; <span class="k">scalar</span> <span class="i">@</span>{<span class="i">$ComparisonValuesRef</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   211  198       <span class="c"># Keep only top kNN values for group fusion...</span>
 | 
| 
 | 
   212  199       <span class="k">splice</span> <span class="i">@ComparisonValues</span><span class="cm">,</span> <span class="i">$OptionsInfo</span>{<span class="w">kNN</span>}<span class="sc">;</span>
 | 
| 
 | 
   213  200     <span class="s">}</span>
 | 
| 
 | 
   214  201     <span class="i">$ComparisonValuesRef</span> = \<span class="i">@ComparisonValues</span><span class="sc">;</span>
 | 
| 
 | 
   215  202   <span class="s">}</span>
 | 
| 
 | 
   216  203 
 | 
| 
 | 
   217  204   <span class="i">$FusedComparisonValue</span> = <span class="i">&</span>{<span class="i">$SimilaritySearchInfo</span>{<span class="w">GroupFusionMethodRef</span>}}<span class="s">(</span><span class="i">$ComparisonValuesRef</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   218  205   <span class="k">if</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">ApplyPrecisionDuringFusion</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   219  206     <span class="i">$FusedComparisonValue</span> = <span class="k">sprintf</span><span class="s">(</span><span class="q">"%.$OptionsInfo{Precision}f"</span><span class="cm">,</span> <span class="i">$FusedComparisonValue</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   220  207   <span class="s">}</span>
 | 
| 
 | 
   221  208 
 | 
| 
 | 
   222  209   <span class="k">return</span> <span class="i">$FusedComparisonValue</span><span class="sc">;</span>
 | 
| 
 | 
   223  210 <span class="s">}</span>
 | 
| 
 | 
   224  211 
 | 
| 
 | 
   225  212 <span class="c"># Collect similarity results for individual reference and multiple references search...</span>
 | 
| 
 | 
   226  213 <span class="c">#</span>
 | 
| 
 | 
   227 <a name="CollectSimilaritySearchResults-"></a> 214 <span class="k">sub </span><span class="m">CollectSimilaritySearchResults</span> <span class="s">{</span>
 | 
| 
 | 
   228  215   <span class="k">my</span><span class="s">(</span><span class="i">$DatabaseFingerprintsFileIO</span><span class="cm">,</span> <span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$ComparisonValue</span><span class="cm">,</span> <span class="i">$ReferenceCmpdID</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   229  216 
 | 
| 
 | 
   230  217   <span class="k">if</span> <span class="s">(</span><span class="k">defined</span> <span class="i">$ReferenceCmpdID</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   231  218     <span class="i">$SimilaritySearchResults</span>{<span class="i">$ReferenceCmpdID</span>}<span class="i">->AddKeyValuePair</span><span class="s">(</span><span class="i">$ComparisonValue</span><span class="cm">,</span> <span class="i">$DatabaseCmpdID</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   232  219   <span class="s">}</span>
 | 
| 
 | 
   233  220   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
   234  221     <span class="i">$SimilaritySearchResults</span>{<span class="w">ResultsPseudoHeap</span>}<span class="i">->AddKeyValuePair</span><span class="s">(</span><span class="i">$ComparisonValue</span><span class="cm">,</span> <span class="i">$DatabaseCmpdID</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   235  222   <span class="s">}</span>
 | 
| 
 | 
   236  223 
 | 
| 
 | 
   237  224   <span class="k">if</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">CollectInputFileData</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   238  225     <span class="i">CollectDatabaseFileData</span><span class="s">(</span><span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$DatabaseFingerprintsFileIO</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   239  226   <span class="s">}</span>
 | 
| 
 | 
   240  227 <span class="s">}</span>
 | 
| 
 | 
   241  228 
 | 
| 
 | 
   242  229 <span class="c"># Initialize similarity results for individual or multiple reference molecules...</span>
 | 
| 
 | 
   243  230 <span class="c">#</span>
 | 
| 
 | 
   244 <a name="InitializeSimilaritySearchResults-"></a> 231 <span class="k">sub </span><span class="m">InitializeSimilaritySearchResults</span> <span class="s">{</span>
 | 
| 
 | 
   245  232   <span class="k">my</span><span class="s">(</span><span class="i">$ReferenceCmpdID</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   246  233 
 | 
| 
 | 
   247  234   <span class="i">%SimilaritySearchResults</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   248  235 
 | 
| 
 | 
   249  236   <span class="k">if</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">IndividualReferenceMode</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   250  237     <span class="k">for</span> <span class="i">$ReferenceCmpdID</span> <span class="s">(</span><span class="i">@</span>{<span class="i">$SimilaritySearchInfo</span>{<span class="w">ReferenceCmpdIDsRef</span>}}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   251  238       <span class="i">$SimilaritySearchResults</span>{<span class="i">$ReferenceCmpdID</span>} = <span class="w">new</span> <span class="i">PseudoHeap</span><span class="s">(</span><span class="q">'Type'</span> <span class="cm">=></span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">KeepTop</span>} ? <span class="q">'KeepTopN'</span> <span class="co">:</span> <span class="q">'KeepBottomN'</span><span class="s">)</span><span class="cm">,</span> <span class="q">'KeyType'</span> <span class="cm">=></span> <span class="q">'Numeric'</span><span class="cm">,</span> <span class="q">'MaxSize'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="w">MaxSimilarMolecules</span>}<span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   252  239     <span class="s">}</span>
 | 
| 
 | 
   253  240   <span class="s">}</span>
 | 
| 
 | 
   254  241   <span class="k">elsif</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">MultipleReferencesMode</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   255  242     <span class="i">$SimilaritySearchResults</span>{<span class="w">ResultsPseudoHeap</span>} = <span class="w">new</span> <span class="i">PseudoHeap</span><span class="s">(</span><span class="q">'Type'</span> <span class="cm">=></span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">KeepTop</span>} ? <span class="q">'KeepTopN'</span> <span class="co">:</span> <span class="q">'KeepBottomN'</span><span class="s">)</span><span class="cm">,</span> <span class="q">'KeyType'</span> <span class="cm">=></span> <span class="q">'Numeric'</span><span class="cm">,</span> <span class="q">'MaxSize'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="w">MaxSimilarMolecules</span>}<span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   256  243   <span class="s">}</span>
 | 
| 
 | 
   257  244 
 | 
| 
 | 
   258  245   <span class="i">%DatabaseFingerprintsFileData</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   259  246 <span class="s">}</span>
 | 
| 
 | 
   260  247 
 | 
| 
 | 
   261  248 <span class="c"># Write out results SD and/or CSV/TSV text files for individual or multiple reference molecules...</span>
 | 
| 
 | 
   262  249 <span class="c">#</span>
 | 
| 
 | 
   263 <a name="WriteSimilaritySearchResultFiles-"></a> 250 <span class="k">sub </span><span class="m">WriteSimilaritySearchResultFiles</span> <span class="s">{</span>
 | 
| 
 | 
   264  251   <span class="k">my</span><span class="s">(</span><span class="i">$NewSDFileRef</span><span class="cm">,</span> <span class="i">$NewTextFileRef</span><span class="cm">,</span> <span class="i">$ReferenceCmpdID</span><span class="cm">,</span> <span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$ComparisonValue</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   265  252 
 | 
| 
 | 
   266  253   <span class="s">(</span><span class="i">$NewSDFileRef</span><span class="cm">,</span> <span class="i">$NewTextFileRef</span><span class="s">)</span> = <span class="i">SetupAndOpenOutputFiles</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   267  254 
 | 
| 
 | 
   268  255   <span class="k">if</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">IndividualReferenceMode</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   269  256     <span class="k">for</span> <span class="i">$ReferenceCmpdID</span> <span class="s">(</span><span class="i">@</span>{<span class="i">$SimilaritySearchInfo</span>{<span class="w">ReferenceCmpdIDsRef</span>}}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   270  257       <span class="k">for</span> <span class="i">$ComparisonValue</span> <span class="s">(</span><span class="i">$SimilaritySearchResults</span>{<span class="i">$ReferenceCmpdID</span>}<span class="i">->GetSortedKeys</span><span class="s">(</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   271  258         <span class="k">for</span> <span class="i">$DatabaseCmpdID</span> <span class="s">(</span><span class="i">$SimilaritySearchResults</span>{<span class="i">$ReferenceCmpdID</span>}<span class="i">->GetKeyValues</span><span class="s">(</span><span class="i">$ComparisonValue</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   272  259           <span class="i">WriteDataToOutputFiles</span><span class="s">(</span><span class="i">$NewSDFileRef</span><span class="cm">,</span> <span class="i">$NewTextFileRef</span><span class="cm">,</span> <span class="i">$ComparisonValue</span><span class="cm">,</span> <span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$ReferenceCmpdID</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   273  260         <span class="s">}</span>
 | 
| 
 | 
   274  261       <span class="s">}</span>
 | 
| 
 | 
   275  262     <span class="s">}</span>
 | 
| 
 | 
   276  263   <span class="s">}</span>
 | 
| 
 | 
   277  264   <span class="k">elsif</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">MultipleReferencesMode</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   278  265     <span class="k">for</span> <span class="i">$ComparisonValue</span> <span class="s">(</span><span class="i">$SimilaritySearchResults</span>{<span class="w">ResultsPseudoHeap</span>}<span class="i">->GetSortedKeys</span><span class="s">(</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   279  266       <span class="k">for</span> <span class="i">$DatabaseCmpdID</span> <span class="s">(</span><span class="i">$SimilaritySearchResults</span>{<span class="w">ResultsPseudoHeap</span>}<span class="i">->GetKeyValues</span><span class="s">(</span><span class="i">$ComparisonValue</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   280  267         <span class="i">WriteDataToOutputFiles</span><span class="s">(</span><span class="i">$NewSDFileRef</span><span class="cm">,</span> <span class="i">$NewTextFileRef</span><span class="cm">,</span> <span class="i">$ComparisonValue</span><span class="cm">,</span> <span class="i">$DatabaseCmpdID</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   281  268       <span class="s">}</span>
 | 
| 
 | 
   282  269     <span class="s">}</span>
 | 
| 
 | 
   283  270   <span class="s">}</span>
 | 
| 
 | 
   284  271 
 | 
| 
 | 
   285  272   <span class="k">if</span> <span class="s">(</span><span class="i">$NewSDFileRef</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   286  273     <span class="k">close</span> <span class="i">$NewSDFileRef</span><span class="sc">;</span>
 | 
| 
 | 
   287  274   <span class="s">}</span>
 | 
| 
 | 
   288  275   <span class="k">if</span> <span class="s">(</span><span class="i">$NewTextFileRef</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   289  276     <span class="k">close</span> <span class="i">$NewTextFileRef</span><span class="sc">;</span>
 | 
| 
 | 
   290  277   <span class="s">}</span>
 | 
| 
 | 
   291  278 <span class="s">}</span>
 | 
| 
 | 
   292  279 
 | 
| 
 | 
   293  280 <span class="c"># Write individual reference or multiple references similarity results along with any other data to output files...</span>
 | 
| 
 | 
   294  281 <span class="c">#</span>
 | 
| 
 | 
   295 <a name="WriteDataToOutputFiles-"></a> 282 <span class="k">sub </span><span class="m">WriteDataToOutputFiles</span> <span class="s">{</span>
 | 
| 
 | 
   296  283   <span class="k">my</span><span class="s">(</span><span class="i">$NewSDFileRef</span><span class="cm">,</span> <span class="i">$NewTextFileRef</span><span class="cm">,</span> <span class="i">$ComparisonValue</span><span class="cm">,</span> <span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$ReferenceCmpdID</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   297  284 
 | 
| 
 | 
   298  285   <span class="k">if</span> <span class="s">(</span><span class="i">$NewSDFileRef</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   299  286     <span class="i">WriteMolStringDataToSDOutputFile</span><span class="s">(</span><span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$NewSDFileRef</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   300  287     <span class="k">if</span> <span class="s">(</span><span class="k">defined</span> <span class="i">$ReferenceCmpdID</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   301  288       <span class="k">print</span> <span class="i">$NewSDFileRef</span>  <span class="q">">  <ReferenceCmpdID>\n$ReferenceCmpdID\n\n"</span><span class="sc">;</span>
 | 
| 
 | 
   302  289     <span class="s">}</span>
 | 
| 
 | 
   303  290     <span class="k">print</span> <span class="i">$NewSDFileRef</span>  <span class="q">">  <DatabaseCmpdID>\n$DatabaseCmpdID\n\n>  <ComparisonValue>\n$ComparisonValue\n\n"</span><span class="sc">;</span>
 | 
| 
 | 
   304  291     <span class="i">WriteDatabaseDataToSDOutputFile</span><span class="s">(</span><span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$NewSDFileRef</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   305  292     <span class="k">print</span> <span class="i">$NewSDFileRef</span> <span class="q">"\$\$\$\$\n"</span><span class="sc">;</span>
 | 
| 
 | 
   306  293   <span class="s">}</span>
 | 
| 
 | 
   307  294 
 | 
| 
 | 
   308  295   <span class="k">if</span> <span class="s">(</span><span class="i">$NewTextFileRef</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   309  296     <span class="k">my</span><span class="s">(</span><span class="i">@LineWords</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   310  297 
 | 
| 
 | 
   311  298     <span class="i">@LineWords</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   312  299     <span class="k">if</span> <span class="s">(</span><span class="k">defined</span> <span class="i">$ReferenceCmpdID</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   313  300       <span class="k">push</span> <span class="i">@LineWords</span><span class="cm">,</span> <span class="i">$ReferenceCmpdID</span><span class="sc">;</span>
 | 
| 
 | 
   314  301     <span class="s">}</span>
 | 
| 
 | 
   315  302     <span class="k">push</span> <span class="i">@LineWords</span><span class="cm">,</span> <span class="s">(</span><span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$ComparisonValue</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   316  303 
 | 
| 
 | 
   317  304     <span class="k">if</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputDataFields</span>} || <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputDataCols</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   318  305       <span class="k">push</span> <span class="i">@LineWords</span><span class="cm">,</span> <span class="i">RetrieveDatabaseDataForTextOutputFile</span><span class="s">(</span><span class="i">$DatabaseCmpdID</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   319  306     <span class="s">}</span>
 | 
| 
 | 
   320  307     <span class="k">print</span> <span class="i">$NewTextFileRef</span> <span class="i">JoinWords</span><span class="s">(</span>\<span class="i">@LineWords</span><span class="cm">,</span> <span class="i">$OptionsInfo</span>{<span class="w">OutDelim</span>}<span class="cm">,</span> <span class="i">$OptionsInfo</span>{<span class="w">OutQuote</span>}<span class="s">)</span><span class="cm">,</span> <span class="q">"\n"</span><span class="sc">;</span>
 | 
| 
 | 
   321  308   <span class="s">}</span>
 | 
| 
 | 
   322  309 <span class="s">}</span>
 | 
| 
 | 
   323  310 
 | 
| 
 | 
   324  311 <span class="c"># Open output files...</span>
 | 
| 
 | 
   325  312 <span class="c">#</span>
 | 
| 
 | 
   326 <a name="SetupAndOpenOutputFiles-"></a> 313 <span class="k">sub </span><span class="m">SetupAndOpenOutputFiles</span> <span class="s">{</span>
 | 
| 
 | 
   327  314   <span class="k">my</span><span class="s">(</span><span class="i">$NewSDFileRef</span><span class="cm">,</span> <span class="i">$NewTextFileRef</span><span class="cm">,</span> <span class="i">$NewSDFile</span><span class="cm">,</span> <span class="i">$NewTextFile</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   328  315 
 | 
| 
 | 
   329  316   <span class="s">(</span><span class="i">$NewSDFileRef</span><span class="cm">,</span> <span class="i">$NewTextFileRef</span><span class="s">)</span> = <span class="s">(</span><span class="k">undef</span><span class="s">)</span> x <span class="n">2</span><span class="sc">;</span>
 | 
| 
 | 
   330  317 
 | 
| 
 | 
   331  318   <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">SDOutput</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   332  319     <span class="i">$NewSDFile</span> = <span class="i">$OutputFilesInfo</span>{<span class="w">SDOutFileName</span>}<span class="sc">;</span>
 | 
| 
 | 
   333  320     <span class="k">print</span> <span class="q">"Generating SD file $NewSDFile...\n"</span><span class="sc">;</span>
 | 
| 
 | 
   334  321     <span class="k">open</span> <span class="w">NEWSDFILE</span><span class="cm">,</span> <span class="q">">$NewSDFile"</span> <span class="k">or</span> <span class="k">die</span> <span class="q">"Error: Couldn't open $NewSDFile: $! \n"</span><span class="sc">;</span>
 | 
| 
 | 
   335  322     <span class="i">$NewSDFileRef</span> = \<span class="i">*NEWSDFILE</span><span class="sc">;</span>
 | 
| 
 | 
   336  323   <span class="s">}</span>
 | 
| 
 | 
   337  324 
 | 
| 
 | 
   338  325   <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">TextOutput</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   339  326     <span class="i">$NewTextFile</span> = <span class="i">$OutputFilesInfo</span>{<span class="w">TextOutFileName</span>}<span class="sc">;</span>
 | 
| 
 | 
   340  327     <span class="k">print</span> <span class="q">"Generating text file $NewTextFile...\n"</span><span class="sc">;</span>
 | 
| 
 | 
   341  328     <span class="k">open</span> <span class="w">NEWTEXTFILE</span><span class="cm">,</span> <span class="q">">$NewTextFile"</span> <span class="k">or</span> <span class="k">die</span> <span class="q">"Error: Couldn't open $NewTextFile: $! \n"</span><span class="sc">;</span>
 | 
| 
 | 
   342  329     <span class="i">$NewTextFileRef</span> = \<span class="i">*NEWTEXTFILE</span><span class="sc">;</span>
 | 
| 
 | 
   343  330 
 | 
| 
 | 
   344  331     <span class="i">WriteTextFileCoulmnLabels</span><span class="s">(</span>\<span class="i">*NEWTEXTFILE</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   345  332   <span class="s">}</span>
 | 
| 
 | 
   346  333 
 | 
| 
 | 
   347  334   <span class="k">return</span> <span class="s">(</span><span class="i">$NewSDFileRef</span><span class="cm">,</span> <span class="i">$NewTextFileRef</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   348  335 <span class="s">}</span>
 | 
| 
 | 
   349  336 
 | 
| 
 | 
   350  337 <span class="c"># Write out appropriate column labels to text file...</span>
 | 
| 
 | 
   351  338 <span class="c">#</span>
 | 
| 
 | 
   352 <a name="WriteTextFileCoulmnLabels-"></a> 339 <span class="k">sub </span><span class="m">WriteTextFileCoulmnLabels</span> <span class="s">{</span>
 | 
| 
 | 
   353  340   <span class="k">my</span><span class="s">(</span><span class="i">$NewTextFileRef</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   354  341   <span class="k">my</span><span class="s">(</span><span class="i">$Line</span><span class="cm">,</span> <span class="i">@LineWords</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   355  342 
 | 
| 
 | 
   356  343   <span class="i">@LineWords</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   357  344 
 | 
| 
 | 
   358  345   <span class="k">if</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">IndividualReferenceMode</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   359  346     <span class="k">push</span> <span class="i">@LineWords</span><span class="cm">,</span> <span class="q">qw(ReferenceCompoundID DatabaseCompoundID ComparisonValue)</span><span class="sc">;</span>
 | 
| 
 | 
   360  347   <span class="s">}</span>
 | 
| 
 | 
   361  348   <span class="k">elsif</span> <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">MultipleReferencesMode</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   362  349     <span class="k">push</span> <span class="i">@LineWords</span><span class="cm">,</span> <span class="q">qw(DatabaseCompoundID ComparisonValue)</span><span class="sc">;</span>
 | 
| 
 | 
   363  350   <span class="s">}</span>
 | 
| 
 | 
   364  351 
 | 
| 
 | 
   365  352   <span class="c"># Add columns for other database fingerprints file data to be written to output file...</span>
 | 
| 
 | 
   366  353   <span class="k">if</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputDataFields</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   367  354     <span class="k">push</span> <span class="i">@LineWords</span><span class="cm">,</span> <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataFieldsToOutput</span>}}<span class="sc">;</span>
 | 
| 
 | 
   368  355   <span class="s">}</span>
 | 
| 
 | 
   369  356   <span class="k">elsif</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputDataCols</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   370  357     <span class="k">push</span> <span class="i">@LineWords</span><span class="cm">,</span> <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColLabelsToOutput</span>}}<span class="sc">;</span>
 | 
| 
 | 
   371  358   <span class="s">}</span>
 | 
| 
 | 
   372  359 
 | 
| 
 | 
   373  360   <span class="i">$Line</span> = <span class="i">JoinWords</span><span class="s">(</span>\<span class="i">@LineWords</span><span class="cm">,</span> <span class="i">$OptionsInfo</span>{<span class="w">OutDelim</span>}<span class="cm">,</span> <span class="i">$OptionsInfo</span>{<span class="w">OutQuote</span>}<span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   374  361   <span class="k">print</span> <span class="i">$NewTextFileRef</span> <span class="q">"$Line\n"</span><span class="sc">;</span>
 | 
| 
 | 
   375  362 <span class="s">}</span>
 | 
| 
 | 
   376  363 
 | 
| 
 | 
   377  364 <span class="c"># Write molecule string data to SD output file...</span>
 | 
| 
 | 
   378  365 <span class="c">#</span>
 | 
| 
 | 
   379 <a name="WriteMolStringDataToSDOutputFile-"></a> 366 <span class="k">sub </span><span class="m">WriteMolStringDataToSDOutputFile</span> <span class="s">{</span>
 | 
| 
 | 
   380  367   <span class="k">my</span><span class="s">(</span><span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$NewSDFileRef</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   381  368 
 | 
| 
 | 
   382  369   <span class="k">if</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">CollectCmpdStringData</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   383  370     <span class="k">my</span><span class="s">(</span><span class="i">$MolString</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   384  371 
 | 
| 
 | 
   385  372     <span class="s">(</span><span class="i">$MolString</span><span class="s">)</span> = <span class="k">split</span> <span class="q">/M  END/</span><span class="cm">,</span> <span class="i">$DatabaseFingerprintsFileData</span>{<span class="i">$DatabaseCmpdID</span>}<span class="sc">;</span>
 | 
| 
 | 
   386  373     <span class="k">print</span> <span class="i">$NewSDFileRef</span> <span class="q">"$MolString\nM  END\n"</span><span class="sc">;</span>
 | 
| 
 | 
   387  374   <span class="s">}</span>
 | 
| 
 | 
   388  375   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
   389  376     <span class="c"># Just write out an empty molecule data string...</span>
 | 
| 
 | 
   390  377     <span class="k">print</span> <span class="i">$NewSDFileRef</span> <span class="i">SDFileUtil::GenerateEmptyCtabBlockLines</span><span class="s">(</span><span class="s">)</span><span class="cm">,</span> <span class="q">"\n"</span><span class="sc">;</span>
 | 
| 
 | 
   391  378   <span class="s">}</span>
 | 
| 
 | 
   392  379 <span class="s">}</span>
 | 
| 
 | 
   393  380 
 | 
| 
 | 
   394  381 <span class="c"># Write database data from SD or Text database file to SD output file...</span>
 | 
| 
 | 
   395  382 <span class="c">#</span>
 | 
| 
 | 
   396 <a name="WriteDatabaseDataToSDOutputFile-"></a> 383 <span class="k">sub </span><span class="m">WriteDatabaseDataToSDOutputFile</span> <span class="s">{</span>
 | 
| 
 | 
   397  384   <span class="k">my</span><span class="s">(</span><span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$NewSDFileRef</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   398  385 
 | 
| 
 | 
   399  386   <span class="k">if</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputDataFields</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   400  387     <span class="k">my</span><span class="s">(</span><span class="i">$DataFieldLabel</span><span class="cm">,</span> <span class="i">$DataFieldValue</span><span class="cm">,</span> <span class="i">@CmpdLines</span><span class="cm">,</span> <span class="i">%DataFieldLabelAndValues</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   401  388 
 | 
| 
 | 
   402  389     <span class="i">@CmpdLines</span> = <span class="k">split</span> <span class="q">/\n/</span><span class="cm">,</span> <span class="i">$DatabaseFingerprintsFileData</span>{<span class="i">$DatabaseCmpdID</span>}<span class="sc">;</span>
 | 
| 
 | 
   403  390     <span class="i">%DataFieldLabelAndValues</span> = <span class="i">GetCmpdDataHeaderLabelsAndValues</span><span class="s">(</span>\<span class="i">@CmpdLines</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   404  391 
 | 
| 
 | 
   405  392     <span class="k">for</span> <span class="i">$DataFieldLabel</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputCurrentDataFields</span>} ? <span class="i">GetCmpdDataHeaderLabels</span><span class="s">(</span>\<span class="i">@CmpdLines</span><span class="s">)</span> <span class="co">:</span> <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataFieldsToOutput</span>}}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   406  393       <span class="i">$DataFieldValue</span> = <span class="k">exists</span> <span class="i">$DataFieldLabelAndValues</span>{<span class="i">$DataFieldLabel</span>} ? <span class="i">$DataFieldLabelAndValues</span>{<span class="i">$DataFieldLabel</span>} <span class="co">:</span> <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
   407  394       <span class="k">print</span> <span class="i">$NewSDFileRef</span>  <span class="q">">  <$DataFieldLabel>\n$DataFieldValue\n\n"</span><span class="sc">;</span>
 | 
| 
 | 
   408  395     <span class="s">}</span>
 | 
| 
 | 
   409  396   <span class="s">}</span>
 | 
| 
 | 
   410  397   <span class="k">elsif</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputDataCols</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   411  398     <span class="k">my</span><span class="s">(</span><span class="i">$DataColNum</span><span class="cm">,</span> <span class="i">$DataFieldLabel</span><span class="cm">,</span> <span class="i">$DataFieldValue</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   412  399 
 | 
| 
 | 
   413  400     <span class="k">for</span> <span class="i">$DataColNum</span> <span class="s">(</span><span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColNumsToOutput</span>}}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   414  401       <span class="i">$DataFieldLabel</span> = <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColNumToLabelMap</span>}{<span class="i">$DataColNum</span>}<span class="sc">;</span>
 | 
| 
 | 
   415  402       <span class="i">$DataFieldValue</span> =  <span class="i">$DatabaseFingerprintsFileData</span>{<span class="i">$DatabaseCmpdID</span>}->[<span class="i">$DataColNum</span>]<span class="sc">;</span>
 | 
| 
 | 
   416  403       <span class="k">print</span> <span class="i">$NewSDFileRef</span>  <span class="q">">  <$DataFieldLabel>\n$DataFieldValue\n\n"</span><span class="sc">;</span>
 | 
| 
 | 
   417  404     <span class="s">}</span>
 | 
| 
 | 
   418  405   <span class="s">}</span>
 | 
| 
 | 
   419  406 <span class="s">}</span>
 | 
| 
 | 
   420  407 
 | 
| 
 | 
   421  408 <span class="c"># Retrieve database data from SD or Text database file for text output file...</span>
 | 
| 
 | 
   422  409 <span class="c"># Returns a list with one value per data field or data column selected for output.</span>
 | 
| 
 | 
   423 <a name="RetrieveDatabaseDataForTextOutputFile-"></a> 410 <span class="k">sub </span><span class="m">RetrieveDatabaseDataForTextOutputFile</span> <span class="s">{</span>
 | 
| 
 | 
   424  411   <span class="k">my</span><span class="s">(</span><span class="i">$DatabaseCmpdID</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   425  412 
 | 
| 
 | 
   426  413   <span class="k">if</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputDataFields</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   427  414     <span class="k">my</span><span class="s">(</span><span class="i">@CmpdLines</span><span class="cm">,</span> <span class="i">%DataFieldLabelAndValues</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   428  415 
 | 
| 
 | 
   429  416     <span class="i">@CmpdLines</span> = <span class="k">split</span> <span class="q">/\n/</span><span class="cm">,</span> <span class="i">$DatabaseFingerprintsFileData</span>{<span class="i">$DatabaseCmpdID</span>}<span class="sc">;</span>
 | 
| 
 | 
   430  417     <span class="i">%DataFieldLabelAndValues</span> = <span class="i">GetCmpdDataHeaderLabelsAndValues</span><span class="s">(</span>\<span class="i">@CmpdLines</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   431  418 
 | 
| 
 | 
   432  419     <span class="k">return</span> <span class="k">map</span> <span class="s">{</span> <span class="k">exists</span> <span class="i">$DataFieldLabelAndValues</span>{<span class="i">$_</span>} ? <span class="i">$DataFieldLabelAndValues</span>{<span class="i">$_</span>} <span class="co">:</span> <span class="q">''</span><span class="s">}</span> <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataFieldsToOutput</span>}}<span class="sc">;</span>
 | 
| 
 | 
   433  420   <span class="s">}</span>
 | 
| 
 | 
   434  421   <span class="k">elsif</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputDataCols</span>}<span class="s">)</span> <span class="s">{</span> <span class="c"># Values are picked by selected column number, as in WriteDatabaseDataToSDOutputFile...</span>
 | 
| 
 | 
   435  422     <span class="k">if</span> <span class="s">(</span><span class="k">exists</span> <span class="i">$DatabaseFingerprintsFileData</span>{<span class="i">$DatabaseCmpdID</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   436  423       <span class="k">return</span> <span class="k">map</span> <span class="s">{</span> <span class="i">$DatabaseFingerprintsFileData</span>{<span class="i">$DatabaseCmpdID</span>}->[<span class="i">$_</span>] <span class="s">}</span> <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColNumsToOutput</span>}}<span class="sc">;</span>
 | 
| 
 | 
   437  424     <span class="s">}</span>
 | 
| 
 | 
   438  425     <span class="k">else</span> <span class="s">{</span> <span class="c"># No collected data: return one empty value per selected column to keep the row aligned with its header...</span>
 | 
| 
 | 
   439  426       <span class="k">return</span> <span class="s">(</span><span class="q">''</span><span class="s">)</span> x <span class="k">scalar</span><span class="s">(</span><span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColNumsToOutput</span>}}<span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   440  427     <span class="s">}</span>
 | 
| 
 | 
   441  428   <span class="s">}</span>
 | 
| 
 | 
   442  429 <span class="s">}</span>
 | 
| 
 | 
   443  430 
 | 
| 
 | 
   444  431 <span class="c"># Collect database file SD compound string or CSV/TSV data line for generating results</span>
 | 
| 
 | 
   445  432 <span class="c"># files...</span>
 | 
| 
 | 
   446  433 <span class="c">#</span>
 | 
| 
 | 
   447 <a name="CollectDatabaseFileData-"></a> 434 <span class="k">sub </span><span class="m">CollectDatabaseFileData</span> <span class="s">{</span>
 | 
| 
 | 
   448  435   <span class="k">my</span><span class="s">(</span><span class="i">$DatabaseCmpdID</span><span class="cm">,</span> <span class="i">$DatabaseFingerprintsFileIO</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   449  436 
 | 
| 
 | 
   450  437   <span class="k">if</span> <span class="s">(</span><span class="k">exists</span> <span class="i">$DatabaseFingerprintsFileData</span>{<span class="i">$DatabaseCmpdID</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   451  438     <span class="k">return</span><span class="sc">;</span>
 | 
| 
 | 
   452  439   <span class="s">}</span>
 | 
| 
 | 
   453  440 
 | 
| 
 | 
   454  441   <span class="k">if</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">CollectCmpdStringData</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   455  442     <span class="i">$DatabaseFingerprintsFileData</span>{<span class="i">$DatabaseCmpdID</span>} = <span class="i">$DatabaseFingerprintsFileIO</span><span class="i">->GetCompoundString</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   456  443   <span class="s">}</span>
 | 
| 
 | 
   457  444 
 | 
| 
 | 
   458  445   <span class="k">if</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">CollectDataLine</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   459  446     <span class="k">my</span><span class="s">(</span><span class="i">@DataLineWords</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   460  447     <span class="i">@DataLineWords</span> = <span class="i">$DatabaseFingerprintsFileIO</span><span class="i">->GetDataLineWords</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   461  448     <span class="i">$DatabaseFingerprintsFileData</span>{<span class="i">$DatabaseCmpdID</span>} = \<span class="i">@DataLineWords</span><span class="sc">;</span>
 | 
| 
 | 
   462  449   <span class="s">}</span>
 | 
| 
 | 
   463  450 
 | 
| 
 | 
   464  451 <span class="s">}</span>
 | 
| 
 | 
   465  452 
 | 
| 
 | 
   466  453 <span class="c"># Read fingerprints data from reference fingerprints file...</span>
 | 
| 
 | 
   467  454 <span class="c">#</span>
 | 
| 
 | 
   468 <a name="ReadReferenceFingerprintsData-"></a> 455 <span class="k">sub </span><span class="m">ReadReferenceFingerprintsData</span> <span class="s">{</span>
 | 
| 
 | 
   469  456   <span class="k">my</span><span class="s">(</span><span class="i">$FingerprintsFileIO</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   470  457 
 | 
| 
 | 
   471  458   <span class="i">$FingerprintsFileIO</span> = <span class="i">Fingerprints::FingerprintsFileUtil::NewFingerprintsFileIO</span><span class="s">(</span><span class="i">%</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FingerprintsFileIOParameters</span>}}<span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   472  459   <span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">ReferenceCmpdIDsRef</span>}<span class="cm">,</span> <span class="i">$SimilaritySearchInfo</span>{<span class="w">ReferenceFingerprintsObjectsRef</span>}<span class="s">)</span> = <span class="i">Fingerprints::FingerprintsFileUtil::ReadAndProcessFingerpritsData</span><span class="s">(</span><span class="i">$FingerprintsFileIO</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   473  460 
 | 
| 
 | 
   474  461 <span class="s">}</span>
 | 
| 
 | 
   475  462 
 | 
| 
 | 
   476  463 <span class="c"># Retrieve information about fingerprints files...</span>
 | 
| 
 | 
   477  464 <span class="c">#</span>
 | 
| 
 | 
   478 <a name="RetrieveFingerprintsFilesInfo-"></a> 465 <span class="k">sub </span><span class="m">RetrieveFingerprintsFilesInfo</span> <span class="s">{</span>
 | 
| 
 | 
   479  466 
 | 
| 
 | 
   480  467   <span class="i">%FingerprintsFilesInfo</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   481  468   <span class="i">%OutputFilesInfo</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   482  469   <span class="i">%SimilaritySearchInfo</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   483  470 
 | 
| 
 | 
   484  471   <span class="i">%</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   485  472   <span class="i">%</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   486  473 
 | 
| 
 | 
   487  474   <span class="c"># Set up reference and database file names...</span>
 | 
| 
 | 
   488  475   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FileName</span>} = <span class="i">$FingerprintsFilesList</span>[<span class="n">0</span>]<span class="sc">;</span>
 | 
| 
 | 
   489  476   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FileName</span>} = <span class="i">$FingerprintsFilesList</span>[<span class="n">1</span>]<span class="sc">;</span>
 | 
| 
 | 
   490  477 
 | 
| 
 | 
   491  478   <span class="c"># Retrieve information about reference and database fingerprints file...</span>
 | 
| 
 | 
   492  479   <span class="i">RetrieveReferenceFingerprintsFileInfo</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   493  480   <span class="i">RetrieveDatabaseFingerprintsFileInfo</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   494  481 
 | 
| 
 | 
   495  482   <span class="c"># Setup fingerprints comparison method and associated method parameters...</span>
 | 
| 
 | 
   496  483   <span class="i">SetupReferenceAndDatabaseFingerprintsComparisonInfo</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   497  484 
 | 
| 
 | 
   498  485   <span class="c"># Retrieve information for output files...</span>
 | 
| 
 | 
   499  486   <span class="i">RetrieveOutputFilesInfo</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   500  487 <span class="s">}</span>
 | 
| 
 | 
   501  488 
 | 
| 
 | 
   502  489 <span class="c"># Set up reference and database fingerprints comparison method and associated method parameters...</span>
 | 
| 
 | 
   503  490 <span class="c">#</span>
 | 
| 
 | 
   504 <a name="SetupReferenceAndDatabaseFingerprintsComparisonInfo-"></a> 491 <span class="k">sub </span><span class="m">SetupReferenceAndDatabaseFingerprintsComparisonInfo</span> <span class="s">{</span>
 | 
| 
 | 
   505  492 
 | 
| 
 | 
   506  493   <span class="c"># Make sure reference and database fingerprints string types and modes match...</span>
 | 
| 
 | 
   507  494   <span class="k">if</span> <span class="s">(</span><span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FirstFingerprintsStringType</span>} !~ <span class="q">/^$FingerprintsFilesInfo{Database}{FirstFingerprintsStringType}$/i</span><span class="s">)</span> ||
 | 
| 
 | 
   508  495      <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FingerprintsBitVectorStringMode</span>} != <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FingerprintsBitVectorStringMode</span>}<span class="s">)</span> ||
 | 
| 
 | 
   509  496      <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FingerprintsVectorStringMode</span>} != <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FingerprintsVectorStringMode</span>}<span class="s">)</span> <span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   510  497     <span class="k">die</span> <span class="q">"Error: First reference fingerprints string type, $FingerprintsFilesInfo{Reference}{FirstFingerprintsStringType}, must match first database fingerprints type, $FingerprintsFilesInfo{Database}{FirstFingerprintsStringType}.\n"</span><span class="sc">;</span>
 | 
| 
 | 
   511  498   <span class="s">}</span>
 | 
| 
 | 
   512  499 
 | 
| 
 | 
   513  500   <span class="k">if</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FirstFingerprintsStringDescription</span>} !~ <span class="q">/^$FingerprintsFilesInfo{Database}{FirstFingerprintsStringDescription}$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   514  501     <span class="k">warn</span> <span class="q">"Warning: First reference fingerprints string description, $FingerprintsFilesInfo{Reference}{FirstFingerprintsStringDescription}, doesn't match first database fingerprints string description, $FingerprintsFilesInfo{Database}{FirstFingerprintsStringDescription}.\n"</span><span class="sc">;</span>
 | 
| 
 | 
   515  502   <span class="s">}</span>
 | 
| 
 | 
   516  503 
 | 
| 
 | 
   517  504   <span class="c"># Setup individual reference and multiple references search mode...</span>
 | 
| 
 | 
   518  505   <span class="i">$SimilaritySearchInfo</span>{<span class="w">IndividualReferenceMode</span>} = <span class="k">undef</span><span class="sc">;</span>
 | 
| 
 | 
   519  506   <span class="i">$SimilaritySearchInfo</span>{<span class="w">MultipleReferencesMode</span>} = <span class="k">undef</span><span class="sc">;</span>
 | 
| 
 | 
   520  507 
 | 
| 
 | 
   521  508   <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">Mode</span>} =~ <span class="q">/^IndividualReference$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   522  509     <span class="i">$SimilaritySearchInfo</span>{<span class="w">IndividualReferenceMode</span>} = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
   523  510   <span class="s">}</span>
 | 
| 
 | 
   524  511   <span class="k">elsif</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">Mode</span>} =~ <span class="q">/^MultipleReferences$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   525  512     <span class="i">$SimilaritySearchInfo</span>{<span class="w">MultipleReferencesMode</span>} = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
   526  513   <span class="s">}</span>
 | 
| 
 | 
   527  514   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
   528  515     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{mode}, for option \"-m, --mode\" is not valid. Allowed values: IndividualReference, MultipleReferences\n"</span><span class="sc">;</span>
 | 
| 
 | 
   529  516   <span class="s">}</span>
 | 
| 
 | 
   530  517 
 | 
| 
 | 
   531  518   <span class="c"># Set up reference and database fingerprints similarity search method and parameters...</span>
 | 
| 
 | 
   532  519   <span class="k">my</span><span class="s">(</span><span class="i">$ComparisonMeasure</span><span class="cm">,</span> <span class="i">$ComparisonMethod</span><span class="cm">,</span> <span class="i">$ApplyComparisonCutoff</span><span class="cm">,</span> <span class="i">$ComparisonCutoff</span><span class="cm">,</span> <span class="i">$KeepTop</span><span class="cm">,</span> <span class="i">@ComparisonMethodParameters</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   533  520 
 | 
| 
 | 
   534  521   <span class="i">$SimilaritySearchInfo</span>{<span class="w">ComparisonMethod</span>} = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
   535  522   <span class="i">@</span>{<span class="i">$SimilaritySearchInfo</span>{<span class="w">ComparisonMethodParameters</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   536  523 
 | 
| 
 | 
   537  524   <span class="i">$SimilaritySearchInfo</span>{<span class="w">ComparisonCutoff</span>} = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
   538  525   <span class="i">$SimilaritySearchInfo</span>{<span class="w">KeepTop</span>} = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
   539  526 
 | 
| 
 | 
   540  527   <span class="i">$ComparisonMeasure</span> = <span class="q">''</span><span class="sc">;</span> <span class="i">$ComparisonMethod</span> = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
   541  528   <span class="i">@ComparisonMethodParameters</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   542  529 
 | 
| 
 | 
   543  530   <span class="j">FINGERPRINTSTYPE:</span> <span class="s">{</span>
 | 
| 
 | 
   544  531     <span class="k">if</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FingerprintsBitVectorStringMode</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   545  532       <span class="i">$ComparisonMeasure</span> = <span class="i">$OptionsInfo</span>{<span class="w">SpecifiedBitVectorComparisonMeasure</span>}<span class="sc">;</span>
 | 
| 
 | 
   546  533       <span class="i">$ComparisonMethod</span> = <span class="i">$OptionsInfo</span>{<span class="w">SpecifiedBitVectorComparisonMeasureMethod</span>}<span class="sc">;</span>
 | 
| 
 | 
   547  534 
 | 
| 
 | 
   548  535       <span class="k">if</span> <span class="s">(</span><span class="i">$ComparisonMeasure</span> =~ <span class="q">/^TverskySimilarity$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   549  536         <span class="k">push</span> <span class="i">@ComparisonMethodParameters</span><span class="cm">,</span> <span class="i">$OptionsInfo</span>{<span class="w">Alpha</span>}<span class="sc">;</span>
 | 
| 
 | 
   550  537       <span class="s">}</span>
 | 
| 
 | 
   551  538       <span class="k">elsif</span> <span class="s">(</span><span class="i">$ComparisonMeasure</span> =~ <span class="q">/^WeightedTverskySimilarity$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   552  539         <span class="k">push</span> <span class="i">@ComparisonMethodParameters</span><span class="cm">,</span> <span class="i">$OptionsInfo</span>{<span class="w">Alpha</span>}<span class="sc">;</span>
 | 
| 
 | 
   553  540         <span class="k">push</span> <span class="i">@ComparisonMethodParameters</span><span class="cm">,</span> <span class="i">$OptionsInfo</span>{<span class="w">Beta</span>}<span class="sc">;</span>
 | 
| 
 | 
   554  541       <span class="s">}</span>
 | 
| 
 | 
   555  542       <span class="k">elsif</span> <span class="s">(</span><span class="i">$ComparisonMeasure</span> =~ <span class="q">/^WeightedTanimotoSimilarity$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   556  543         <span class="k">push</span> <span class="i">@ComparisonMethodParameters</span><span class="cm">,</span> <span class="i">$OptionsInfo</span>{<span class="w">Beta</span>}<span class="sc">;</span>
 | 
| 
 | 
   557  544       <span class="s">}</span>
 | 
| 
 | 
   558  545 
 | 
| 
 | 
   559  546       <span class="k">last</span> <span class="j">FINGERPRINTSTYPE</span><span class="sc">;</span>
 | 
| 
 | 
   560  547     <span class="s">}</span>
 | 
| 
 | 
   561  548     <span class="k">if</span> <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FingerprintsVectorStringMode</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   562  549       <span class="k">my</span><span class="s">(</span><span class="i">$SkipValuesCheck</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   563  550 
 | 
| 
 | 
   564  551       <span class="i">$ComparisonMeasure</span> = <span class="i">$OptionsInfo</span>{<span class="w">SpecifiedVectorComparisonMeasure</span>}<span class="sc">;</span>
 | 
| 
 | 
   565  552       <span class="i">$ComparisonMethod</span> = <span class="i">$OptionsInfo</span>{<span class="w">SpecifiedVectorComparisonMeasuresMethod</span>}<span class="sc">;</span>
 | 
| 
 | 
   566  553 
 | 
| 
 | 
   567  554       <span class="k">push</span> <span class="i">@ComparisonMethodParameters</span><span class="cm">,</span> <span class="i">$OptionsInfo</span>{<span class="w">SpecifiedVectorComparisonMode</span>}<span class="sc">;</span>
 | 
| 
 | 
   568  555 
 | 
| 
 | 
   569  556       <span class="i">$SkipValuesCheck</span> = <span class="i">$OptionsInfo</span>{<span class="w">Fast</span>} ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   570  557       <span class="k">push</span> <span class="i">@ComparisonMethodParameters</span><span class="cm">,</span> <span class="i">$SkipValuesCheck</span><span class="sc">;</span>
 | 
| 
 | 
   571  558 
 | 
| 
 | 
   572  559       <span class="k">last</span> <span class="j">FINGERPRINTSTYPE</span><span class="sc">;</span>
 | 
| 
 | 
   573  560     <span class="s">}</span>
 | 
| 
 | 
   574  561     <span class="k">die</span> <span class="q">"Error: Uknown fingerprints string type. Supported values: FingerprintsBitVectorString or FingerprintsVectorString.\n"</span><span class="sc">;</span>
 | 
| 
 | 
   575  562   <span class="s">}</span>
 | 
| 
 | 
   576  563 
 | 
| 
 | 
   577  564   <span class="i">$ApplyComparisonCutoff</span> = <span class="i">$SimilaritySearchInfo</span>{<span class="w">IndividualReferenceMode</span>} ? <span class="n">1</span> <span class="co">:</span> <span class="s">(</span><span class="s">(</span><span class="i">$SimilaritySearchInfo</span>{<span class="w">MultipleReferencesMode</span>} && <span class="i">$OptionsInfo</span>{<span class="w">GroupFusionApplyCutoff</span>}<span class="s">)</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   578  565 
 | 
| 
 | 
   579  566   <span class="i">$ComparisonCutoff</span> = <span class="q">''</span><span class="sc">;</span> <span class="i">$KeepTop</span> = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
   580  567   <span class="k">if</span> <span class="s">(</span><span class="i">$ComparisonMethod</span> =~ <span class="q">/Distance/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   581  568     <span class="i">$ComparisonCutoff</span> = <span class="i">$OptionsInfo</span>{<span class="w">DistanceCutoff</span>}<span class="sc">;</span>
 | 
| 
 | 
   582  569     <span class="i">$KeepTop</span> = <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">SearchMode</span>} =~ <span class="q">/^SimilaritySearch$/i</span><span class="s">)</span> ? <span class="n">0</span> <span class="co">:</span> <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
   583  570   <span class="s">}</span>
 | 
| 
 | 
   584  571   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
   585  572     <span class="i">$ComparisonCutoff</span> = <span class="i">$OptionsInfo</span>{<span class="w">SimilarityCutoff</span>}<span class="sc">;</span>
 | 
| 
 | 
   586  573     <span class="i">$KeepTop</span> = <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">SearchMode</span>} =~ <span class="q">/^SimilaritySearch$/i</span><span class="s">)</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   587  574   <span class="s">}</span>
 | 
| 
 | 
   588  575 
 | 
| 
 | 
   589  576   <span class="i">$SimilaritySearchInfo</span>{<span class="w">ComparisonMethod</span>} = <span class="i">$ComparisonMethod</span><span class="sc">;</span>
 | 
| 
 | 
   590  577   <span class="i">@</span>{<span class="i">$SimilaritySearchInfo</span>{<span class="w">ComparisonMethodParameters</span>}} = <span class="i">@ComparisonMethodParameters</span><span class="sc">;</span>
 | 
| 
 | 
   591  578 
 | 
| 
 | 
   592  579   <span class="i">$SimilaritySearchInfo</span>{<span class="w">ComparisonCutoff</span>} = <span class="i">$ComparisonCutoff</span><span class="sc">;</span>
 | 
| 
 | 
   593  580   <span class="i">$SimilaritySearchInfo</span>{<span class="w">KeepTop</span>} = <span class="i">$KeepTop</span><span class="sc">;</span>
 | 
| 
 | 
   594  581   <span class="i">$SimilaritySearchInfo</span>{<span class="w">ApplyComparisonCutoff</span>} = <span class="i">$ApplyComparisonCutoff</span><span class="sc">;</span>
 | 
| 
 | 
   595  582 
 | 
| 
 | 
   596  583   <span class="c"># Setup references to group fusion methods...</span>
 | 
| 
 | 
   597  584   <span class="i">$SimilaritySearchInfo</span>{<span class="w">GroupFusionMethodRef</span>} = <span class="k">undef</span><span class="sc">;</span>
 | 
| 
 | 
   598  585   <span class="i">$SimilaritySearchInfo</span>{<span class="w">ApplyPrecisionDuringFusion</span>} = <span class="k">undef</span><span class="sc">;</span>
 | 
| 
 | 
   599  586 
 | 
| 
 | 
   600  587   <span class="j">FUSIONRULE:</span> <span class="s">{</span>
 | 
| 
 | 
   601  588     <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">GroupFusionRule</span>} =~ <span class="q">/^Max$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   602  589       <span class="c"># It's always the first value in the appropriately sorted list using value of KeepTop...</span>
 | 
| 
 | 
   603  590       <span class="i">$SimilaritySearchInfo</span>{<span class="w">GroupFusionMethodRef</span>} = <span class="k">sub</span> <span class="s">{</span> <span class="k">my</span><span class="s">(</span><span class="i">$ComparisonValuesRef</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span> <span class="k">return</span> <span class="i">$ComparisonValuesRef</span>->[<span class="n">0</span>]<span class="sc">;</span> <span class="s">}</span><span class="sc">;</span>
 | 
| 
 | 
   604  591       <span class="k">last</span> <span class="j">FUSIONRULE</span><span class="sc">;</span>
 | 
| 
 | 
   605  592     <span class="s">}</span>
 | 
| 
 | 
   606  593     <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">GroupFusionRule</span>} =~ <span class="q">/^Min$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   607  594       <span class="c"># It's always the last value in the appropriately sorted list using value of KeepTop...</span>
 | 
| 
 | 
   608  595       <span class="i">$SimilaritySearchInfo</span>{<span class="w">GroupFusionMethodRef</span>} = <span class="k">sub</span> <span class="s">{</span> <span class="k">my</span><span class="s">(</span><span class="i">$ComparisonValuesRef</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span> <span class="k">return</span> <span class="i">$ComparisonValuesRef</span>->[<span class="i">$#</span>{<span class="i">$ComparisonValuesRef</span>}]<span class="sc">;</span> <span class="s">}</span><span class="sc">;</span>
 | 
| 
 | 
   609  596       <span class="k">last</span> <span class="j">FUSIONRULE</span><span class="sc">;</span>
 | 
| 
 | 
   610  597     <span class="s">}</span>
 | 
| 
 | 
   611  598     <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">GroupFusionRule</span>} =~ <span class="q">/^Mean$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   612  599       <span class="i">$SimilaritySearchInfo</span>{<span class="w">GroupFusionMethodRef</span>} = \<span class="i">&StatisticsUtil::Mean</span><span class="sc">;</span>
 | 
| 
 | 
   613  600       <span class="i">$SimilaritySearchInfo</span>{<span class="w">ApplyPrecisionDuringFusion</span>} = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
   614  601       <span class="k">last</span> <span class="j">FUSIONRULE</span><span class="sc">;</span>
 | 
| 
 | 
   615  602     <span class="s">}</span>
 | 
| 
 | 
   616  603     <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">GroupFusionRule</span>} =~ <span class="q">/^Median$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   617  604       <span class="i">$SimilaritySearchInfo</span>{<span class="w">GroupFusionMethodRef</span>} = \<span class="i">&StatisticsUtil::Median</span><span class="sc">;</span>
 | 
| 
 | 
   618  605       <span class="i">$SimilaritySearchInfo</span>{<span class="w">ApplyPrecisionDuringFusion</span>} = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
   619  606       <span class="k">last</span> <span class="j">FUSIONRULE</span><span class="sc">;</span>
 | 
| 
 | 
   620  607     <span class="s">}</span>
 | 
| 
 | 
   621  608     <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">GroupFusionRule</span>} =~ <span class="q">/^Sum$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   622  609       <span class="i">$SimilaritySearchInfo</span>{<span class="w">GroupFusionMethodRef</span>} = \<span class="i">&StatisticsUtil::Sum</span><span class="sc">;</span>
 | 
| 
 | 
   623  610       <span class="i">$SimilaritySearchInfo</span>{<span class="w">ApplyPrecisionDuringFusion</span>} = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
   624  611       <span class="k">last</span> <span class="j">FUSIONRULE</span><span class="sc">;</span>
 | 
| 
 | 
   625  612     <span class="s">}</span>
 | 
| 
 | 
   626  613     <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">GroupFusionRule</span>} =~ <span class="q">/^Euclidean$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   627  614       <span class="i">$SimilaritySearchInfo</span>{<span class="w">GroupFusionMethodRef</span>} = \<span class="i">&StatisticsUtil::Euclidean</span><span class="sc">;</span>
 | 
| 
 | 
   628  615       <span class="i">$SimilaritySearchInfo</span>{<span class="w">ApplyPrecisionDuringFusion</span>} = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
   629  616       <span class="k">last</span> <span class="j">FUSIONRULE</span><span class="sc">;</span>
 | 
| 
 | 
   630  617     <span class="s">}</span>
 | 
| 
 | 
   631  618     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{groupfusionrule}, for option \"-g, --GroupFusionRule\" is not valid. Allowed values: Max, Min, Mean, Median, Sum, Euclidean\n"</span><span class="sc">;</span>
 | 
| 
 | 
   632  619   <span class="s">}</span>
 | 
| 
 | 
   633  620 
 | 
| 
 | 
   634  621   <span class="i">$SimilaritySearchInfo</span>{<span class="w">UsekNN</span>} = <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">kNN</span>} !~ <span class="q">/^All$/i</span><span class="s">)</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   635  622   <span class="i">$SimilaritySearchInfo</span>{<span class="w">SortComparisonValues</span>} = <span class="s">(</span><span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">GroupFusionRule</span>} =~ <span class="q">/^(Max|Min)$/i</span><span class="s">)</span> || <span class="i">$SimilaritySearchInfo</span>{<span class="w">UsekNN</span>}<span class="s">)</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   636  623 <span class="s">}</span>
 | 
| 
 | 
   637  624 
 | 
| 
 | 
   638  625 <span class="c"># Retrieve information about reference fingerprints file...</span>
 | 
| 
 | 
   639  626 <span class="c">#</span>
 | 
| 
 | 
   640 <a name="RetrieveReferenceFingerprintsFileInfo-"></a> 627 <span class="k">sub </span><span class="m">RetrieveReferenceFingerprintsFileInfo</span> <span class="s">{</span>
 | 
| 
 | 
   641  628   <span class="k">my</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="cm">,</span> <span class="i">$FileType</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="cm">,</span> <span class="i">$FingerprintsFileIO</span><span class="cm">,</span> <span class="i">$FingerprintsStringMode</span><span class="cm">,</span> <span class="i">$FingerprintsBitVectorStringMode</span><span class="cm">,</span> <span class="i">$FingerprintsVectorStringMode</span><span class="cm">,</span> <span class="i">$FirstFingerprintsStringType</span><span class="cm">,</span> <span class="i">$FirstFingerprintsStringDescription</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   642  629 
 | 
| 
 | 
   643  630   <span class="i">$FingerprintsFile</span> = <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FileName</span>}<span class="sc">;</span>
 | 
| 
 | 
   644  631   <span class="s">(</span><span class="i">$FileType</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="s">)</span> =  <span class="i">RetrieveFingerprintsFileInfo</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   645  632 
 | 
| 
 | 
   646  633   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FileType</span>} = <span class="i">$FileType</span><span class="sc">;</span>
 | 
| 
 | 
   647  634   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">InDelim</span>} = <span class="i">$InDelim</span><span class="sc">;</span>
 | 
| 
 | 
   648  635 
 | 
| 
 | 
   649  636   <span class="c"># Setup reference FingerprintsFileIO parameters...</span>
 | 
| 
 | 
   650  637   <span class="i">%</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FingerprintsFileIOParameters</span>}} = <span class="i">RetrieveFingerprintsFileIOParameters</span><span class="s">(</span><span class="q">'Reference'</span><span class="cm">,</span> <span class="i">$FileType</span><span class="cm">,</span> <span class="i">$FingerprintsFile</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   651  638 
 | 
| 
 | 
   652  639   <span class="c"># Make sure reference fingerprints data file contains valid data and retrieve fingerprints string mode information...</span>
 | 
| 
 | 
   653  640   <span class="s">(</span><span class="i">$FingerprintsStringMode</span><span class="cm">,</span> <span class="i">$FingerprintsBitVectorStringMode</span><span class="cm">,</span> <span class="i">$FingerprintsVectorStringMode</span><span class="cm">,</span> <span class="i">$FirstFingerprintsStringType</span><span class="cm">,</span> <span class="i">$FirstFingerprintsStringDescription</span><span class="s">)</span> = <span class="i">RetrieveFingerprintsFileFingerprintsStringInfo</span><span class="s">(</span><span class="q">'Reference'</span><span class="cm">,</span> <span class="i">$FingerprintsFile</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   654  641   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FingerprintsStringMode</span>} = <span class="i">$FingerprintsStringMode</span><span class="sc">;</span>
 | 
| 
 | 
   655  642   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FingerprintsBitVectorStringMode</span>} = <span class="i">$FingerprintsBitVectorStringMode</span><span class="sc">;</span>
 | 
| 
 | 
   656  643   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FingerprintsVectorStringMode</span>} = <span class="i">$FingerprintsVectorStringMode</span><span class="sc">;</span>
 | 
| 
 | 
   657  644   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FirstFingerprintsStringType</span>} = <span class="i">$FirstFingerprintsStringType</span><span class="sc">;</span>
 | 
| 
 | 
   658  645   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FirstFingerprintsStringDescription</span>} = <span class="i">$FirstFingerprintsStringDescription</span><span class="sc">;</span>
 | 
| 
 | 
   659  646 
 | 
| 
 | 
   660  647 <span class="s">}</span>
 | 
| 
 | 
   661  648 
 | 
| 
 | 
   662  649 <span class="c"># Retrieve information about database fingerprints file...</span>
 | 
| 
 | 
   663  650 <span class="c">#</span>
 | 
| 
 | 
   664 <a name="RetrieveDatabaseFingerprintsFileInfo-"></a> 651 <span class="k">sub </span><span class="m">RetrieveDatabaseFingerprintsFileInfo</span> <span class="s">{</span>
 | 
| 
 | 
   665  652   <span class="k">my</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="cm">,</span> <span class="i">$FileType</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="cm">,</span> <span class="i">$FingerprintsFileIO</span><span class="cm">,</span> <span class="i">$FingerprintsStringMode</span><span class="cm">,</span> <span class="i">$FingerprintsBitVectorStringMode</span><span class="cm">,</span> <span class="i">$FingerprintsVectorStringMode</span><span class="cm">,</span> <span class="i">$FirstFingerprintsStringType</span><span class="cm">,</span> <span class="i">$FirstFingerprintsStringDescription</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   666  653 
 | 
| 
 | 
   667  654   <span class="i">$FingerprintsFile</span> = <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FileName</span>}<span class="sc">;</span>
 | 
| 
 | 
   668  655   <span class="s">(</span><span class="i">$FileType</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="s">)</span> =  <span class="i">RetrieveFingerprintsFileInfo</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   669  656 
 | 
| 
 | 
   670  657   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FileType</span>} = <span class="i">$FileType</span><span class="sc">;</span>
 | 
| 
 | 
   671  658   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">InDelim</span>} = <span class="i">$InDelim</span><span class="sc">;</span>
 | 
| 
 | 
   672  659 
 | 
| 
 | 
   673  660   <span class="c"># Setup database FingerprintsFileIO parameters...</span>
 | 
| 
 | 
   674  661   <span class="i">%</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FingerprintsFileIOParameters</span>}} = <span class="i">RetrieveFingerprintsFileIOParameters</span><span class="s">(</span><span class="q">'Database'</span><span class="cm">,</span> <span class="i">$FileType</span><span class="cm">,</span> <span class="i">$FingerprintsFile</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   675  662 
 | 
| 
 | 
   676  663   <span class="c"># Make sure database fingerprints data file contains valid data and retrieve fingerprints string mode information...</span>
 | 
| 
 | 
   677  664   <span class="s">(</span><span class="i">$FingerprintsStringMode</span><span class="cm">,</span> <span class="i">$FingerprintsBitVectorStringMode</span><span class="cm">,</span> <span class="i">$FingerprintsVectorStringMode</span><span class="cm">,</span> <span class="i">$FirstFingerprintsStringType</span><span class="cm">,</span> <span class="i">$FirstFingerprintsStringDescription</span><span class="s">)</span> = <span class="i">RetrieveFingerprintsFileFingerprintsStringInfo</span><span class="s">(</span><span class="q">'Database'</span><span class="cm">,</span> <span class="i">$FingerprintsFile</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   678  665   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FingerprintsStringMode</span>} = <span class="i">$FingerprintsStringMode</span><span class="sc">;</span>
 | 
| 
 | 
   679  666   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FingerprintsBitVectorStringMode</span>} = <span class="i">$FingerprintsBitVectorStringMode</span><span class="sc">;</span>
 | 
| 
 | 
   680  667   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FingerprintsVectorStringMode</span>} = <span class="i">$FingerprintsVectorStringMode</span><span class="sc">;</span>
 | 
| 
 | 
   681  668   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FirstFingerprintsStringType</span>} = <span class="i">$FirstFingerprintsStringType</span><span class="sc">;</span>
 | 
| 
 | 
   682  669   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FirstFingerprintsStringDescription</span>} = <span class="i">$FirstFingerprintsStringDescription</span><span class="sc">;</span>
 | 
| 
 | 
   683  670 
 | 
| 
 | 
   684  671   <span class="c"># Retrieve database fingerprints data field information for output file...</span>
 | 
| 
 | 
   685  672   <span class="c">#</span>
 | 
| 
 | 
   686  673   <span class="i">RetrieveDatabaseFingerprintsDataFieldsInfo</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="cm">,</span> <span class="i">$FileType</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   687  674 
 | 
| 
 | 
   688  675   <span class="c"># Retrieve database fingerprints text file data columns information for output file...</span>
 | 
| 
 | 
   689  676   <span class="c">#</span>
 | 
| 
 | 
   690  677   <span class="i">RetrieveDatabaseFingerprintsDataColsInfo</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="cm">,</span> <span class="i">$FileType</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   691  678 
 | 
| 
 | 
   692  679   <span class="c"># Any need to collect database compound string or data line for generation of results files...</span>
 | 
| 
 | 
   693  680   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">CollectCmpdStringData</span>} = <span class="s">(</span><span class="i">$FileType</span> =~ <span class="q">/^SD$/i</span><span class="s">)</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   694  681   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">CollectDataLine</span>} = <span class="s">(</span><span class="i">$FileType</span> =~ <span class="q">/^Text$/i</span> && <span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataColsMode</span>} =~ <span class="q">/^(All|Specify)$/i</span><span class="s">)</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   695  682   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">CollectInputFileData</span>} = <span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">CollectCmpdStringData</span>} || <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">CollectDataLine</span>}<span class="s">)</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   696  683 
 | 
| 
 | 
   697  684   <span class="c"># Set maximum number of similar compounds to find for individual reference or set of multiple</span>
 | 
| 
 | 
   698  685   <span class="c"># reference compounds...</span>
 | 
| 
 | 
   699  686   <span class="c">#</span>
 | 
| 
 | 
   700  687   <span class="i">SetMaximumSimilarMoleculesToRetrieve</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="cm">,</span> <span class="i">$FileType</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   701  688 <span class="s">}</span>
 | 
| 
 | 
   702  689 
 | 
| 
 | 
   703  690 <span class="c"># Retrieve database fingerprints data field information...</span>
 | 
| 
 | 
   704  691 <span class="c">#</span>
 | 
| 
 | 
   705 <a name="RetrieveDatabaseFingerprintsDataFieldsInfo-"></a> 692 <span class="k">sub </span><span class="m">RetrieveDatabaseFingerprintsDataFieldsInfo</span> <span class="s">{</span>
 | 
| 
 | 
   706  693   <span class="k">my</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="cm">,</span> <span class="i">$FileType</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   707  694   <span class="k">my</span><span class="s">(</span><span class="i">$CollectDataFields</span><span class="cm">,</span> <span class="i">$CmpdCount</span><span class="cm">,</span> <span class="i">$AllDataFieldsRef</span><span class="cm">,</span> <span class="i">$CommonDataFieldsRef</span><span class="cm">,</span> <span class="i">@DataFieldsToOutput</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   708  695 
 | 
| 
 | 
   709  696   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputDataFields</span>} = <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   710  697   <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataFieldsToOutput</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   711  698 
 | 
| 
 | 
   712  699   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputCurrentDataFields</span>} = <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   713  700 
 | 
| 
 | 
   714  701   <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">AllDataFields</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   715  702   <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">CommonDataFields</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   716  703   <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">SpecifiedDatabaseDataFields</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   717  704 
 | 
| 
 | 
   718  705   <span class="k">if</span> <span class="s">(</span><span class="i">$FileType</span> !~ <span class="q">/^SD$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   719  706     <span class="k">return</span><span class="sc">;</span>
 | 
| 
 | 
   720  707   <span class="s">}</span>
 | 
| 
 | 
   721  708 
 | 
| 
 | 
   722  709   <span class="c"># No need to go over SD file and collect data fields for SD output file during All DatabaseDataFieldsMode as</span>
 | 
| 
 | 
   723  710   <span class="c"># they would be retrieved from database SD file compound string during generation of output files...</span>
 | 
| 
 | 
   724  711   <span class="c">#</span>
 | 
| 
 | 
   725  712   <span class="i">$CollectDataFields</span> = <span class="s">(</span><span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">TextOutput</span>} && <span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataFieldsMode</span>} =~ <span class="q">/^(All|Common)$/i</span><span class="s">)</span> || <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">SDOutput</span>} && <span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataFieldsMode</span>} =~ <span class="q">/^Common$/i</span><span class="s">)</span><span class="s">)</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   726  713 
 | 
| 
 | 
   727  714   <span class="s">(</span><span class="i">$CmpdCount</span><span class="cm">,</span> <span class="i">$AllDataFieldsRef</span><span class="cm">,</span> <span class="i">$CommonDataFieldsRef</span><span class="s">)</span> = <span class="s">(</span><span class="k">undef</span><span class="s">)</span> x <span class="n">2</span><span class="sc">;</span>
 | 
| 
 | 
   728  715 
 | 
| 
 | 
   729  716   <span class="k">if</span> <span class="s">(</span><span class="i">$CollectDataFields</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   730  717     <span class="k">open</span> <span class="w">SDFILE</span><span class="cm">,</span> <span class="q">"$FingerprintsFile"</span> <span class="k">or</span> <span class="k">die</span> <span class="q">"Error: Couldn't open $FingerprintsFile: $! \n"</span><span class="sc">;</span>
 | 
| 
 | 
   731  718     <span class="s">(</span><span class="i">$CmpdCount</span><span class="cm">,</span> <span class="i">$AllDataFieldsRef</span><span class="cm">,</span> <span class="i">$CommonDataFieldsRef</span><span class="s">)</span> = <span class="i">GetAllAndCommonCmpdDataHeaderLabels</span><span class="s">(</span>\<span class="i">*SDFILE</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   732  719     <span class="k">close</span> <span class="w">SDFILE</span><span class="sc">;</span>
 | 
| 
 | 
   733  720   <span class="s">}</span>
 | 
| 
 | 
   734  721 
 | 
| 
 | 
   735  722   <span class="i">@DataFieldsToOutput</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   736  723   <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataFieldsMode</span>} =~ <span class="q">/^All$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   737  724     <span class="k">if</span> <span class="s">(</span><span class="k">defined</span> <span class="i">$AllDataFieldsRef</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   738  725       <span class="k">push</span> <span class="i">@DataFieldsToOutput</span><span class="cm">,</span> <span class="i">@</span>{<span class="i">$AllDataFieldsRef</span>}<span class="sc">;</span>
 | 
| 
 | 
   739  726       <span class="k">push</span> <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">AllDataFields</span>}}<span class="cm">,</span> <span class="i">@</span>{<span class="i">$AllDataFieldsRef</span>}<span class="sc">;</span>
 | 
| 
 | 
   740  727     <span class="s">}</span>
 | 
| 
 | 
   741  728     <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
   742  729       <span class="c"># Retrieve and output data fields and values dynamically...</span>
 | 
| 
 | 
   743  730       <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputCurrentDataFields</span>} = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
   744  731     <span class="s">}</span>
 | 
| 
 | 
   745  732   <span class="s">}</span>
 | 
| 
 | 
   746  733   <span class="k">elsif</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataFieldsMode</span>} =~ <span class="q">/^Common$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   747  734     <span class="k">if</span> <span class="s">(</span><span class="k">defined</span> <span class="i">$CommonDataFieldsRef</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   748  735       <span class="k">push</span> <span class="i">@DataFieldsToOutput</span><span class="cm">,</span> <span class="i">@</span>{<span class="i">$CommonDataFieldsRef</span>}<span class="sc">;</span>
 | 
| 
 | 
   749  736       <span class="k">push</span> <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">CommonDataFields</span>}}<span class="cm">,</span> <span class="i">@</span>{<span class="i">$CommonDataFieldsRef</span>}<span class="sc">;</span>
 | 
| 
 | 
   750  737     <span class="s">}</span>
 | 
| 
 | 
   751  738   <span class="s">}</span>
 | 
| 
 | 
   752  739   <span class="k">elsif</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataFieldsMode</span>} =~ <span class="q">/^Specify$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   753  740     <span class="k">push</span> <span class="i">@DataFieldsToOutput</span><span class="cm">,</span> <span class="i">@</span>{<span class="i">$OptionsInfo</span>{<span class="w">SpecifiedDatabaseDataFields</span>}}<span class="sc">;</span>
 | 
| 
 | 
   754  741     <span class="k">push</span> <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">SpecifiedDatabaseDataFields</span>}}<span class="cm">,</span> <span class="i">@</span>{<span class="i">$OptionsInfo</span>{<span class="w">SpecifiedDatabaseDataFields</span>}}<span class="sc">;</span>
 | 
| 
 | 
   755  742   <span class="s">}</span>
 | 
| 
 | 
   756  743 
 | 
| 
 | 
   757  744   <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataFieldsMode</span>} !~ <span class="q">/^CompoundID$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   758  745     <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputDataFields</span>} = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
   759  746   <span class="s">}</span>
 | 
| 
 | 
   760  747 
 | 
| 
 | 
   761  748   <span class="k">push</span> <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataFieldsToOutput</span>}}<span class="cm">,</span> <span class="i">@DataFieldsToOutput</span><span class="sc">;</span>
 | 
| 
 | 
   762  749 
 | 
| 
 | 
   763  750 <span class="s">}</span>
 | 
| 
 | 
   764  751 
 | 
| 
 | 
   765  752 <span class="c"># Retrieve database fingerprints data columns information...</span>
 | 
| 
 | 
   766  753 <span class="c">#</span>
 | 
| 
 | 
   767 <a name="RetrieveDatabaseFingerprintsDataColsInfo-"></a> 754 <span class="k">sub </span><span class="m">RetrieveDatabaseFingerprintsDataColsInfo</span> <span class="s">{</span>
 | 
| 
 | 
   768  755   <span class="k">my</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="cm">,</span> <span class="i">$FileType</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   769  756   <span class="k">my</span><span class="s">(</span><span class="i">$Line</span><span class="cm">,</span> <span class="i">$ColNum</span><span class="cm">,</span> <span class="i">$ColLabel</span><span class="cm">,</span> <span class="i">$NumOfCols</span><span class="cm">,</span> <span class="i">@DataColLabels</span><span class="cm">,</span> <span class="i">@DataColLabelsToOutput</span><span class="cm">,</span> <span class="i">@DataColNumsToOutput</span><span class="cm">,</span> <span class="i">%DataColLabelToNumMap</span><span class="cm">,</span> <span class="i">%DataColNumToLabelMap</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   770  757 
 | 
| 
 | 
   771  758   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputDataCols</span>} = <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   772  759 
 | 
| 
 | 
   773  760   <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColLabels</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   774  761   <span class="i">%</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColLabelToNumMap</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   775  762   <span class="i">%</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColNumToLabelMap</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   776  763 
 | 
| 
 | 
   777  764   <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColNumsToOutput</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   778  765   <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColLabelsToOutput</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   779  766 
 | 
| 
 | 
   780  767   <span class="k">if</span> <span class="s">(</span><span class="i">$FileType</span> !~ <span class="q">/^Text$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   781  768     <span class="k">return</span><span class="sc">;</span>
 | 
| 
 | 
   782  769   <span class="s">}</span>
 | 
| 
 | 
   783  770 
 | 
| 
 | 
   784  771   <span class="i">@DataColLabels</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   785  772   <span class="i">@DataColLabelsToOutput</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   786  773   <span class="i">@DataColNumsToOutput</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   787  774 
 | 
| 
 | 
   788  775   <span class="i">%DataColLabelToNumMap</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   789  776   <span class="i">%DataColNumToLabelMap</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   790  777 
 | 
| 
 | 
   791  778   <span class="c"># Get column label line...</span>
 | 
| 
 | 
   792  779   <span class="k">open</span> <span class="w">TEXTFILE</span><span class="cm">,</span> <span class="q">"$FingerprintsFile"</span> <span class="k">or</span> <span class="k">die</span> <span class="q">"Error: Couldn't open $FingerprintsFile: $! \n"</span><span class="sc">;</span>
 | 
| 
 | 
   793  780   <span class="i">$Line</span> = <span class="i">TextUtil::GetTextLine</span><span class="s">(</span>\<span class="i">*TEXTFILE</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   794  781   <span class="k">close</span> <span class="w">TEXTFILE</span><span class="sc">;</span>
 | 
| 
 | 
   795  782 
 | 
| 
 | 
   796  783   <span class="i">$InDelim</span> = <span class="s">(</span><span class="i">$InDelim</span> =~ <span class="q">/^Tab$/i</span><span class="s">)</span> ? <span class="q">"\t"</span> <span class="co">:</span> <span class="s">(</span><span class="i">$InDelim</span> =~ <span class="q">/semicolon/i</span> ? <span class="q">"\;"</span> <span class="co">:</span> <span class="q">"\,"</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   797  784 
 | 
| 
 | 
   798  785   <span class="i">@DataColLabels</span> = <span class="i">TextUtil::SplitWords</span><span class="s">(</span><span class="i">$Line</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   799  786   <span class="i">$NumOfCols</span> = <span class="k">scalar</span> <span class="i">@DataColLabels</span><span class="sc">;</span>
 | 
| 
 | 
   800  787 
 | 
| 
 | 
   801  788   <span class="k">for</span> <span class="i">$ColNum</span> <span class="s">(</span><span class="n">0</span> .. <span class="i">$#DataColLabels</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   802  789     <span class="i">$ColLabel</span> = <span class="i">$DataColLabels</span>[<span class="i">$ColNum</span>]<span class="sc">;</span>
 | 
| 
 | 
   803  790     <span class="i">$DataColLabelToNumMap</span>{<span class="i">$ColLabel</span>} = <span class="i">$ColNum</span><span class="sc">;</span>
 | 
| 
 | 
   804  791     <span class="i">$DataColNumToLabelMap</span>{<span class="i">$ColNum</span>} = <span class="i">$ColLabel</span><span class="sc">;</span>
 | 
| 
 | 
   805  792   <span class="s">}</span>
 | 
| 
 | 
   806  793 
 | 
| 
 | 
   807  794   <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataColsMode</span>} =~ <span class="q">/^Specify$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   808  795     <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">DatabaseColMode</span>} =~ <span class="q">/^ColNum$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   809  796       <span class="k">for</span> <span class="i">$ColNum</span> <span class="s">(</span><span class="i">@</span>{<span class="i">$OptionsInfo</span>{<span class="w">SpecifiedDatabaseDataCols</span>}}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   810  797         <span class="k">if</span> <span class="s">(</span><span class="i">$ColNum</span> > <span class="i">$NumOfCols</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   811  798           <span class="k">die</span> <span class="q">"Error: Column number, $ColNum, specified using \"--DatabaseDataCols\" is not valid: It must be &lt;= $NumOfCols\n"</span><span class="sc">;</span>
 | 
| 
 | 
   812  799         <span class="s">}</span>
 | 
| 
 | 
   813  800         <span class="k">push</span> <span class="i">@DataColNumsToOutput</span><span class="cm">,</span> <span class="s">(</span><span class="i">$ColNum</span> - <span class="n">1</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   814  801       <span class="s">}</span>
 | 
| 
 | 
   815  802     <span class="s">}</span>
 | 
| 
 | 
   816  803     <span class="k">elsif</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">DatabaseColMode</span>} =~ <span class="q">/^ColLabel$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   817  804       <span class="k">for</span> <span class="i">$ColLabel</span> <span class="s">(</span><span class="i">@</span>{<span class="i">$OptionsInfo</span>{<span class="w">SpecifiedDatabaseDataCols</span>}}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   818  805         <span class="k">if</span> <span class="s">(</span>!<span class="k">exists</span> <span class="i">$DataColLabelToNumMap</span>{<span class="i">$ColLabel</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   819  806           <span class="k">die</span> <span class="q">"Error: Column label, $ColLabel, specified using \"--DatabaseDataCols\" is not valid: It doesn't exist\n"</span><span class="sc">;</span>
 | 
| 
 | 
   820  807         <span class="s">}</span>
 | 
| 
 | 
   821  808         <span class="k">push</span> <span class="i">@DataColNumsToOutput</span><span class="cm">,</span> <span class="i">$DataColLabelToNumMap</span>{<span class="i">$ColLabel</span>}<span class="sc">;</span>
 | 
| 
 | 
   822  809       <span class="s">}</span>
 | 
| 
 | 
   823  810     <span class="s">}</span>
 | 
| 
 | 
   824  811   <span class="s">}</span>
 | 
| 
 | 
   825  812   <span class="k">elsif</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataColsMode</span>} =~ <span class="q">/^All$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   826  813     <span class="i">@DataColNumsToOutput</span> = <span class="k">map</span> <span class="s">{</span> <span class="i">$_</span> <span class="s">}</span> <span class="s">(</span><span class="n">0</span> .. <span class="i">$#DataColLabels</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   827  814   <span class="s">}</span>
 | 
| 
 | 
   828  815 
 | 
| 
 | 
   829  816   <span class="c"># Setup data column labels to output...</span>
 | 
| 
 | 
   830  817   <span class="k">if</span> <span class="s">(</span><span class="k">scalar</span> <span class="i">@DataColNumsToOutput</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   831  818     <span class="i">@DataColLabelsToOutput</span> = <span class="k">map</span> <span class="s">{</span> <span class="i">$DataColNumToLabelMap</span>{<span class="i">$_</span>} <span class="s">}</span> <span class="s">(</span><span class="n">0</span> .. <span class="i">$#DataColNumsToOutput</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   832  819   <span class="s">}</span>
 | 
| 
 | 
   833  820 
 | 
| 
 | 
   834  821   <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">OutputDataCols</span>} = <span class="k">scalar</span> <span class="i">@DataColNumsToOutput</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   835  822 
 | 
| 
 | 
   836  823   <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColLabels</span>}} = <span class="i">@DataColLabels</span><span class="sc">;</span>
 | 
| 
 | 
   837  824   <span class="i">%</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColLabelToNumMap</span>}} = <span class="i">%DataColLabelToNumMap</span><span class="sc">;</span>
 | 
| 
 | 
   838  825   <span class="i">%</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColNumToLabelMap</span>}} = <span class="i">%DataColNumToLabelMap</span><span class="sc">;</span>
 | 
| 
 | 
   839  826 
 | 
| 
 | 
   840  827   <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColNumsToOutput</span>}} = <span class="i">@DataColNumsToOutput</span><span class="sc">;</span>
 | 
| 
 | 
   841  828   <span class="i">@</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">DataColLabelsToOutput</span>}} = <span class="i">@DataColLabelsToOutput</span><span class="sc">;</span>
 | 
| 
 | 
   842  829 <span class="s">}</span>
 | 
| 
 | 
   843  830 
 | 
| 
 | 
   844  831 <span class="c"># Set maximum number of similar compounds to find for individual reference or set of multiple</span>
 | 
| 
 | 
   845  832 <span class="c"># reference compounds...</span>
 | 
| 
 | 
   846  833 <span class="c">#</span>
 | 
| 
 | 
   847 <a name="SetMaximumSimilarMoleculesToRetrieve-"></a> 834 <span class="k">sub </span><span class="m">SetMaximumSimilarMoleculesToRetrieve</span> <span class="s">{</span>
 | 
| 
 | 
   848  835   <span class="k">my</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="cm">,</span> <span class="i">$FileType</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   849  836   <span class="k">my</span><span class="s">(</span><span class="i">$MaxSimilarMolecules</span><span class="cm">,</span> <span class="i">$NumOfDatabaseMolecules</span><span class="cm">,</span> <span class="i">$PercentSimilarMolecules</span><span class="cm">,</span> <span class="i">$Line</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   850  837 
 | 
| 
 | 
   851  838   <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">SimilarCountMode</span>} !~ <span class="q">/^PercentSimilar$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   852  839     <span class="k">return</span><span class="sc">;</span>
 | 
| 
 | 
   853  840   <span class="s">}</span>
 | 
| 
 | 
   854  841 
 | 
| 
 | 
   855  842   <span class="i">$PercentSimilarMolecules</span> = <span class="i">$OptionsInfo</span>{<span class="w">PercentSimilarMolecules</span>}<span class="sc">;</span>
 | 
| 
 | 
   856  843 
 | 
| 
 | 
   857  844   <span class="c"># Count database entries to figure out MaxSimilarMolecules using PercentSimilarMolecules</span>
 | 
| 
 | 
   858  845   <span class="c"># value...</span>
 | 
| 
 | 
   859  846   <span class="i">$NumOfDatabaseMolecules</span> = <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   860  847   <span class="k">if</span> <span class="s">(</span><span class="i">$FileType</span> =~ <span class="q">/^SD$/i</span> && <span class="k">exists</span><span class="s">(</span><span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">NumOfDatabaseMolecules</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   861  848     <span class="c"># It might already be counted for SD file...</span>
 | 
| 
 | 
   862  849     <span class="i">$NumOfDatabaseMolecules</span> = <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">NumOfDatabaseMolecules</span>}<span class="sc">;</span>
 | 
| 
 | 
   863  850   <span class="s">}</span>
 | 
| 
 | 
   864  851   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
   865  852     <span class="k">print</span> <span class="q">"Calculating maximum number of similar molecules to retrieve for \"PercentSimilar\" value of \"--SimilarCountMode\" option by counting number of molecules in database fingerprints file...\n"</span><span class="sc">;</span>
 | 
| 
 | 
   866  853     <span class="k">open</span> <span class="w">FINGERPRINTSFILE</span><span class="cm">,</span> <span class="q">"$FingerprintsFile"</span> <span class="k">or</span> <span class="k">die</span> <span class="q">"Error: Couldn't open $FingerprintsFile: $! \n"</span><span class="sc">;</span>
 | 
| 
 | 
   867  854     <span class="j">FILETYPE:</span> <span class="s">{</span>
 | 
| 
 | 
   868  855       <span class="k">if</span> <span class="s">(</span><span class="i">$FileType</span> =~ <span class="q">/^SD$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   869  856         <span class="k">while</span> <span class="s">(</span><span class="i">$Line</span> = <span class="i">TextUtil::GetTextLine</span><span class="s">(</span>\<span class="i">*FINGERPRINTSFILE</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   870  857           <span class="k">if</span> <span class="s">(</span><span class="i">$Line</span> =~ <span class="q">/^\$\$\$\$/</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   871  858             <span class="i">$NumOfDatabaseMolecules</span>++<span class="sc">;</span>
 | 
| 
 | 
   872  859           <span class="s">}</span>
 | 
| 
 | 
   873  860         <span class="s">}</span>
 | 
| 
 | 
   874  861         <span class="k">last</span> <span class="j">FILETYPE</span><span class="sc">;</span>
 | 
| 
 | 
   875  862       <span class="s">}</span>
 | 
| 
 | 
   876  863       <span class="k">if</span> <span class="s">(</span><span class="i">$FileType</span> =~ <span class="q">/^Text$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   877  864         <span class="c"># Ignore column label line...</span>
 | 
| 
 | 
   878  865         <span class="i">$Line</span> = <span class="i">TextUtil::GetTextLine</span><span class="s">(</span>\<span class="i">*FINGERPRINTSFILE</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   879  866         <span class="k">while</span> <span class="s">(</span><span class="i">$Line</span> = <span class="i">TextUtil::GetTextLine</span><span class="s">(</span>\<span class="i">*FINGERPRINTSFILE</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   880  867           <span class="i">$NumOfDatabaseMolecules</span>++<span class="sc">;</span>
 | 
| 
 | 
   881  868         <span class="s">}</span>
 | 
| 
 | 
   882  869         <span class="k">last</span> <span class="j">FILETYPE</span><span class="sc">;</span>
 | 
| 
 | 
   883  870       <span class="s">}</span>
 | 
| 
 | 
   884  871       <span class="k">if</span> <span class="s">(</span><span class="i">$FileType</span> =~ <span class="q">/^FP$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   885  872         <span class="k">while</span> <span class="s">(</span><span class="i">$Line</span> = <span class="i">TextUtil::GetTextLine</span><span class="s">(</span>\<span class="i">*FINGERPRINTSFILE</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   886  873           <span class="k">if</span> <span class="s">(</span><span class="i">$Line</span> !~ <span class="q">/^#/</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   887  874             <span class="i">$NumOfDatabaseMolecules</span>++<span class="sc">;</span>
 | 
| 
 | 
   888  875           <span class="s">}</span>
 | 
| 
 | 
   889  876         <span class="s">}</span>
 | 
| 
 | 
   890  877         <span class="k">last</span> <span class="j">FILETYPE</span><span class="sc">;</span>
 | 
| 
 | 
   891  878       <span class="s">}</span>
 | 
| 
 | 
   892  879       <span class="i">$NumOfDatabaseMolecules</span> = <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
   893  880     <span class="s">}</span>
 | 
| 
 | 
   894  881     <span class="k">close</span> <span class="w">FINGERPRINTSFILE</span><span class="sc">;</span>
 | 
| 
 | 
   895  882     <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">NumOfDatabaseMolecules</span>} = <span class="i">$NumOfDatabaseMolecules</span><span class="sc">;</span>
 | 
| 
 | 
   896  883   <span class="s">}</span>
 | 
| 
 | 
   897  884 
 | 
| 
 | 
   898  885   <span class="i">$MaxSimilarMolecules</span> = <span class="k">int</span> <span class="s">(</span><span class="s">(</span><span class="i">$NumOfDatabaseMolecules</span> * <span class="i">$PercentSimilarMolecules</span><span class="s">)</span>/<span class="n">100</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   899  886   <span class="k">if</span> <span class="s">(</span><span class="i">$MaxSimilarMolecules</span> < <span class="n">1</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   900  887     <span class="i">$MaxSimilarMolecules</span> = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
   901  888   <span class="s">}</span>
 | 
| 
 | 
   902  889 
 | 
| 
 | 
   903  890   <span class="i">$OptionsInfo</span>{<span class="w">MaxSimilarMolecules</span>} = <span class="i">$MaxSimilarMolecules</span><span class="sc">;</span>
 | 
| 
 | 
   904  891 <span class="s">}</span>
 | 
| 
 | 
   905  892 
 | 
| 
 | 
   906  893 <span class="c"># Retrieve information about fingerprints file...</span>
 | 
| 
 | 
   907  894 <span class="c">#</span>
 | 
| 
 | 
   908 <a name="RetrieveFingerprintsFileInfo-"></a> 895 <span class="k">sub </span><span class="m">RetrieveFingerprintsFileInfo</span> <span class="s">{</span>
 | 
| 
 | 
   909  896   <span class="k">my</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   910  897   <span class="k">my</span><span class="s">(</span><span class="i">$FileType</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="cm">,</span> <span class="i">$FileDir</span><span class="cm">,</span> <span class="i">$FileExt</span><span class="cm">,</span> <span class="i">$FileName</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   911  898 
 | 
| 
 | 
   912  899   <span class="k">if</span> <span class="s">(</span>!<span class="s">(</span><span class="k">-e</span> <span class="i">$FingerprintsFile</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   913  900     <span class="k">die</span> <span class="q">"Error: Input fingerprints file, $FingerprintsFile, doesn't exist.\n"</span><span class="sc">;</span>
 | 
| 
 | 
   914  901   <span class="s">}</span>
 | 
| 
 | 
   915  902 
 | 
| 
 | 
   916  903   <span class="i">$FileType</span> = <span class="i">Fingerprints::FingerprintsFileUtil::GetFingerprintsFileType</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   917  904   <span class="k">if</span> <span class="s">(</span><span class="i">IsEmpty</span><span class="s">(</span><span class="i">$FileType</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   918  905     <span class="k">die</span> <span class="q">"Error: Input file, $FingerprintsFile, is not a fingerprints file.\n"</span><span class="sc">;</span>
 | 
| 
 | 
   919  906   <span class="s">}</span>
 | 
| 
 | 
   920  907 
 | 
| 
 | 
   921  908   <span class="i">$InDelim</span> = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
   922  909   <span class="k">if</span> <span class="s">(</span><span class="i">$FileType</span> =~ <span class="q">/^Text$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   923  910     <span class="i">$FileDir</span> = <span class="q">""</span><span class="sc">;</span> <span class="i">$FileName</span> = <span class="q">""</span><span class="sc">;</span> <span class="i">$FileExt</span> = <span class="q">""</span><span class="sc">;</span>
 | 
| 
 | 
   924  911     <span class="s">(</span><span class="i">$FileDir</span><span class="cm">,</span> <span class="i">$FileName</span><span class="cm">,</span> <span class="i">$FileExt</span><span class="s">)</span> = <span class="i">ParseFileName</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   925  912     <span class="i">$InDelim</span> = <span class="s">(</span><span class="i">$FileExt</span> =~ <span class="q">/^tsv$/i</span><span class="s">)</span> ? <span class="q">'Tab'</span> <span class="co">:</span> <span class="i">$OptionsInfo</span>{<span class="w">InDelim</span>}<span class="sc">;</span>
 | 
| 
 | 
   926  913   <span class="s">}</span>
 | 
| 
 | 
   927  914 
 | 
| 
 | 
   928  915   <span class="k">return</span> <span class="s">(</span><span class="i">$FileType</span><span class="cm">,</span> <span class="i">$InDelim</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   929  916 <span class="s">}</span>
 | 
| 
 | 
   930  917 
 | 
| 
 | 
   931  918 <span class="c"># Retrieve fingerprints file IO parameters...</span>
 | 
| 
 | 
   932  919 <span class="c">#</span>
 | 
| 
 | 
   933 <a name="RetrieveFingerprintsFileIOParameters-"></a> 920 <span class="k">sub </span><span class="m">RetrieveFingerprintsFileIOParameters</span> <span class="s">{</span>
 | 
| 
 | 
   934  921   <span class="k">my</span><span class="s">(</span><span class="i">$FingerprintsFileMode</span><span class="cm">,</span> <span class="i">$FileType</span><span class="cm">,</span> <span class="i">$FingerprintsFile</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   935  922   <span class="k">my</span><span class="s">(</span><span class="i">%FingerprintsFileIOParams</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   936  923 
 | 
| 
 | 
   937  924   <span class="k">if</span> <span class="s">(</span><span class="i">$FingerprintsFileMode</span> !~ <span class="q">/^(Reference|Database)$/</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   938  925     <span class="k">die</span> <span class="q">"Error: Unknown fingerprints file mode: $FingerprintsFileMode. Supported values: Reference or Database\n"</span><span class="sc">;</span>
 | 
| 
 | 
   939  926   <span class="s">}</span>
 | 
| 
 | 
   940  927 
 | 
| 
 | 
   941  928   <span class="i">%FingerprintsFileIOParams</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   942  929 
 | 
| 
 | 
   943  930   <span class="j">FILETYPE:</span> <span class="s">{</span>
 | 
| 
 | 
   944  931     <span class="k">if</span> <span class="s">(</span><span class="i">$FileType</span> =~ <span class="q">/^SD$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   945  932       <span class="i">%FingerprintsFileIOParams</span> = <span class="s">(</span><span class="q">'Name'</span> <span class="cm">=></span> <span class="i">$FingerprintsFile</span><span class="cm">,</span> <span class="q">'Mode'</span> <span class="cm">=></span> <span class="q">'Read'</span><span class="cm">,</span> <span class="q">'FingerprintsStringMode'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="w">FingerprintsMode</span>}<span class="cm">,</span> <span class="q">'ValidateData'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="w">ValidateData</span>}<span class="cm">,</span> <span class="q">'DetailLevel'</span> <span class="cm">=></span>  <span class="i">$OptionsInfo</span>{<span class="w">Detail</span>}<span class="cm">,</span> <span class="q">'FingerprintsFieldLabel'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="q">"${FingerprintsFileMode}FingerprintsField"</span>}<span class="cm">,</span> <span class="q">'CompoundIDMode'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="q">"${FingerprintsFileMode}CompoundIDMode"</span>}<span class="cm">,</span> <span class="q">'CompoundIDFieldLabel'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="q">"${FingerprintsFileMode}CompoundIDField"</span>}<span class="cm">,</span> <span class="q">'CompoundIDPrefix'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="q">"${FingerprintsFileMode}CompoundIDPrefix"</span>}<span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   946  933       <span class="k">last</span> <span class="j">FILETYPE</span><span class="sc">;</span>
 | 
| 
 | 
   947  934     <span class="s">}</span>
 | 
| 
 | 
   948  935     <span class="k">if</span> <span class="s">(</span><span class="i">$FileType</span> =~ <span class="q">/^FP$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   949  936       <span class="i">%FingerprintsFileIOParams</span> = <span class="s">(</span><span class="q">'Name'</span> <span class="cm">=></span> <span class="i">$FingerprintsFile</span><span class="cm">,</span> <span class="q">'Mode'</span> <span class="cm">=></span> <span class="q">'Read'</span><span class="cm">,</span> <span class="q">'FingerprintsStringMode'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="w">FingerprintsMode</span>}<span class="cm">,</span> <span class="q">'ValidateData'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="w">ValidateData</span>}<span class="cm">,</span> <span class="q">'DetailLevel'</span> <span class="cm">=></span>  <span class="i">$OptionsInfo</span>{<span class="w">Detail</span>}<span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   950  937       <span class="k">last</span> <span class="j">FILETYPE</span><span class="sc">;</span>
 | 
| 
 | 
   951  938     <span class="s">}</span>
 | 
| 
 | 
   952  939     <span class="k">if</span> <span class="s">(</span><span class="i">$FileType</span> =~ <span class="q">/^Text$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   953  940       <span class="i">%FingerprintsFileIOParams</span> = <span class="s">(</span><span class="q">'Name'</span> <span class="cm">=></span> <span class="i">$FingerprintsFile</span><span class="cm">,</span> <span class="q">'Mode'</span> <span class="cm">=></span> <span class="q">'Read'</span><span class="cm">,</span> <span class="q">'FingerprintsStringMode'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="w">FingerprintsMode</span>}<span class="cm">,</span> <span class="q">'ValidateData'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="w">ValidateData</span>}<span class="cm">,</span> <span class="q">'DetailLevel'</span> <span class="cm">=></span>  <span class="i">$OptionsInfo</span>{<span class="w">Detail</span>}<span class="cm">,</span> <span class="q">'FingerprintsCol'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="q">"${FingerprintsFileMode}FingerprintsCol"</span>}<span class="cm">,</span> <span class="q">'ColMode'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="q">"${FingerprintsFileMode}ColMode"</span>}<span class="cm">,</span> <span class="q">'CompoundIDCol'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="q">"${FingerprintsFileMode}CompoundIDCol"</span>}<span class="cm">,</span> <span class="q">'CompoundIDPrefix'</span> <span class="cm">=></span> <span class="i">$OptionsInfo</span>{<span class="q">"${FingerprintsFileMode}CompoundIDPrefix"</span>}<span class="cm">,</span> <span class="q">'InDelim'</span> <span class="cm">=></span> <span class="i">$FingerprintsFilesInfo</span>{<span class="i">$FingerprintsFileMode</span>}{<span class="w">InDelim</span>}<span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   954  941       <span class="k">last</span> <span class="j">FILETYPE</span><span class="sc">;</span>
 | 
| 
 | 
   955  942     <span class="s">}</span>
 | 
| 
 | 
   956  943     <span class="k">die</span> <span class="q">"Error: Fingerprints file type, $FileType, is not valid. Supported file types: SD, FP or Text\n"</span><span class="sc">;</span>
 | 
| 
 | 
   957  944   <span class="s">}</span>
 | 
| 
 | 
   958  945 
 | 
| 
 | 
   959  946   <span class="k">return</span> <span class="i">%FingerprintsFileIOParams</span><span class="sc">;</span>
 | 
| 
 | 
   960  947 <span class="s">}</span>
 | 
| 
 | 
   961  948 
 | 
| 
 | 
   962  949 <span class="c"># Make sure fingerprints data file contains valid data and retrieve fingerprints string mode information...</span>
 | 
| 
 | 
   963  950 <span class="c">#</span>
 | 
| 
 | 
   964 <a name="RetrieveFingerprintsFileFingerprintsStringInfo-"></a> 951 <span class="k">sub </span><span class="m">RetrieveFingerprintsFileFingerprintsStringInfo</span> <span class="s">{</span>
 | 
| 
 | 
   965  952   <span class="k">my</span><span class="s">(</span><span class="i">$FingerprintsFileMode</span><span class="cm">,</span> <span class="i">$FingerprintsFile</span><span class="s">)</span> = <span class="i">@_</span><span class="sc">;</span>
 | 
| 
 | 
   966  953   <span class="k">my</span><span class="s">(</span><span class="i">$FingerprintsFileIO</span><span class="cm">,</span> <span class="i">$FingerprintsStringMode</span><span class="cm">,</span> <span class="i">$FingerprintsBitVectorStringMode</span><span class="cm">,</span> <span class="i">$FingerprintsVectorStringMode</span><span class="cm">,</span> <span class="i">$FirstFingerprintsStringType</span><span class="cm">,</span> <span class="i">$FirstFingerprintsStringDescription</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   967  954 
 | 
| 
 | 
   968  955   <span class="i">$FingerprintsFileIO</span> = <span class="i">Fingerprints::FingerprintsFileUtil::NewFingerprintsFileIO</span><span class="s">(</span><span class="i">%</span>{<span class="i">$FingerprintsFilesInfo</span>{<span class="i">$FingerprintsFileMode</span>}{<span class="w">FingerprintsFileIOParameters</span>}}<span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   969  956   <span class="k">if</span> <span class="s">(</span>!<span class="i">$FingerprintsFileIO</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   970  957     <span class="k">die</span> <span class="q">"Error: Reference fingerprints file, $FingerprintsFile, contains invalid fingerprints data.\n"</span><span class="sc">;</span>
 | 
| 
 | 
   971  958   <span class="s">}</span>
 | 
| 
 | 
   972  959   <span class="k">if</span> <span class="s">(</span>!<span class="i">$FingerprintsFileIO</span><span class="i">->IsFingerprintsFileDataValid</span><span class="s">(</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
   973  960     <span class="k">die</span> <span class="q">"Error: Reference fingerprints file, $FingerprintsFile, contains invalid fingerprints data.\n"</span><span class="sc">;</span>
 | 
| 
 | 
   974  961   <span class="s">}</span>
 | 
| 
 | 
   975  962 
 | 
| 
 | 
   976  963   <span class="i">$FingerprintsStringMode</span> = <span class="i">$FingerprintsFileIO</span><span class="i">->GetFingerprintsStringMode</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   977  964   <span class="i">$FingerprintsBitVectorStringMode</span> = <span class="i">$FingerprintsFileIO</span><span class="i">->GetFingerprintsBitVectorStringMode</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   978  965   <span class="i">$FingerprintsVectorStringMode</span> = <span class="i">$FingerprintsFileIO</span><span class="i">->GetFingerprintsVectorStringMode</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   979  966 
 | 
| 
 | 
   980  967   <span class="i">$FirstFingerprintsStringType</span> = <span class="i">$FingerprintsFileIO</span><span class="i">->GetFirstFingerprintsStringType</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   981  968   <span class="i">$FirstFingerprintsStringDescription</span> = <span class="i">$FingerprintsFileIO</span><span class="i">->GetFirstFingerprintsStringDescription</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   982  969 
 | 
| 
 | 
   983  970   <span class="i">$FingerprintsFileIO</span><span class="i">->Close</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   984  971 
 | 
| 
 | 
   985  972   <span class="k">return</span> <span class="s">(</span><span class="i">$FingerprintsStringMode</span><span class="cm">,</span> <span class="i">$FingerprintsBitVectorStringMode</span><span class="cm">,</span> <span class="i">$FingerprintsVectorStringMode</span><span class="cm">,</span> <span class="i">$FirstFingerprintsStringType</span><span class="cm">,</span> <span class="i">$FirstFingerprintsStringDescription</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   986  973 <span class="s">}</span>
 | 
| 
 | 
   987  974 
 | 
| 
 | 
   988  975 <span class="c"># Retrieve output file names using reference fingerprints file name...</span>
 | 
| 
 | 
   989  976 <span class="c">#</span>
 | 
| 
 | 
   990 <a name="RetrieveOutputFilesInfo-"></a> 977 <span class="k">sub </span><span class="m">RetrieveOutputFilesInfo</span> <span class="s">{</span>
 | 
| 
 | 
   991  978   <span class="k">my</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="cm">,</span> <span class="i">$FileDir</span><span class="cm">,</span> <span class="i">$FileExt</span><span class="cm">,</span> <span class="i">$FileName</span><span class="cm">,</span> <span class="i">$OutFileRoot</span><span class="cm">,</span> <span class="i">$SDOutFileName</span><span class="cm">,</span> <span class="i">$TextOutFileName</span><span class="cm">,</span> <span class="i">$SDOutFileExt</span><span class="cm">,</span> <span class="i">$TextOutFileExt</span><span class="cm">,</span> <span class="i">$ReferenceFileName</span><span class="cm">,</span> <span class="i">$DatabaseFileName</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
   992  979 
 | 
| 
 | 
   993  980   <span class="i">$OutputFilesInfo</span>{<span class="w">OutFileRoot</span>} = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
   994  981   <span class="i">$OutputFilesInfo</span>{<span class="w">SDOutFileName</span>} = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
   995  982   <span class="i">$OutputFilesInfo</span>{<span class="w">TextOutFileName</span>} = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
   996  983 
 | 
| 
 | 
   997  984   <span class="i">$FingerprintsFile</span> = <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FileName</span>}<span class="sc">;</span>
 | 
| 
 | 
   998  985 
 | 
| 
 | 
   999  986   <span class="i">$FileDir</span> = <span class="q">""</span><span class="sc">;</span> <span class="i">$FileName</span> = <span class="q">""</span><span class="sc">;</span> <span class="i">$FileExt</span> = <span class="q">""</span><span class="sc">;</span>
 | 
| 
 | 
  1000  987   <span class="s">(</span><span class="i">$FileDir</span><span class="cm">,</span> <span class="i">$FileName</span><span class="cm">,</span> <span class="i">$FileExt</span><span class="s">)</span> = <span class="i">ParseFileName</span><span class="s">(</span><span class="i">$FingerprintsFile</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1001  988 
 | 
| 
 | 
  1002  989   <span class="i">$SDOutFileExt</span> = <span class="q">"sdf"</span><span class="sc">;</span>
 | 
| 
 | 
  1003  990   <span class="i">$TextOutFileExt</span> = <span class="s">(</span><span class="i">$Options</span>{<span class="w">outdelim</span>} =~ <span class="q">/^tab$/i</span><span class="s">)</span> ? <span class="q">"tsv"</span> <span class="co">:</span> <span class="q">"csv"</span><span class="sc">;</span>
 | 
| 
 | 
  1004  991 
 | 
| 
 | 
  1005  992   <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">OutFileRoot</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1006  993     <span class="k">my</span> <span class="s">(</span><span class="i">$RootFileDir</span><span class="cm">,</span> <span class="i">$RootFileName</span><span class="cm">,</span> <span class="i">$RootFileExt</span><span class="s">)</span> = <span class="i">ParseFileName</span><span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">OutFileRoot</span>}<span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1007  994     <span class="k">if</span> <span class="s">(</span><span class="i">$RootFileName</span> && <span class="i">$RootFileExt</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1008  995       <span class="i">$FileName</span> = <span class="i">$RootFileName</span><span class="sc">;</span>
 | 
| 
 | 
  1009  996     <span class="s">}</span>
 | 
| 
 | 
  1010  997     <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
  1011  998       <span class="i">$FileName</span> = <span class="i">$OptionsInfo</span>{<span class="w">OutFileRoot</span>}<span class="sc">;</span>
 | 
| 
 | 
  1012  999     <span class="s">}</span>
 | 
| 
 | 
  1013 1000     <span class="i">$OutFileRoot</span> = <span class="i">$FileName</span><span class="sc">;</span>
 | 
| 
 | 
  1014 1001   <span class="s">}</span>
 | 
| 
 | 
  1015 1002   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
  1016 1003     <span class="i">$OutFileRoot</span> = <span class="q">"${FileName}SimilaritySearching"</span><span class="sc">;</span>
 | 
| 
 | 
  1017 1004   <span class="s">}</span>
 | 
| 
 | 
  1018 1005 
 | 
| 
 | 
  1019 1006   <span class="i">$SDOutFileName</span> = <span class="q">"${OutFileRoot}.${SDOutFileExt}"</span><span class="sc">;</span>
 | 
| 
 | 
  1020 1007   <span class="i">$TextOutFileName</span> = <span class="q">"${OutFileRoot}.${TextOutFileExt}"</span><span class="sc">;</span>
 | 
| 
 | 
  1021 1008 
 | 
| 
 | 
  1022 1009   <span class="i">$ReferenceFileName</span> = <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Reference</span>}{<span class="w">FileName</span>}<span class="sc">;</span>
 | 
| 
 | 
  1023 1010   <span class="i">$DatabaseFileName</span> = <span class="i">$FingerprintsFilesInfo</span>{<span class="w">Database</span>}{<span class="w">FileName</span>}<span class="sc">;</span>
 | 
| 
 | 
  1024 1011 
 | 
| 
 | 
  1025 1012   <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">SDOutput</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1026 1013     <span class="k">if</span> <span class="s">(</span><span class="i">$SDOutFileName</span> =~ <span class="q">/^$ReferenceFileName$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1027 1014       <span class="k">die</span> <span class="q">"Error: Same output, $SDOutFileName, and reference input file names.\nSpecify a different name using \"-r --root\" option or use default name.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1028 1015     <span class="s">}</span>
 | 
| 
 | 
  1029 1016     <span class="k">if</span> <span class="s">(</span><span class="i">$SDOutFileName</span> =~ <span class="q">/^$DatabaseFileName$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1030 1017       <span class="k">die</span> <span class="q">"Error: Same output, $SDOutFileName, and database input file names.\nSpecify a different name using \"-r --root\" option or use default name.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1031 1018     <span class="s">}</span>
 | 
| 
 | 
  1032 1019   <span class="s">}</span>
 | 
| 
 | 
  1033 1020 
 | 
| 
 | 
  1034 1021   <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">TextOutput</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1035 1022     <span class="k">if</span> <span class="s">(</span><span class="i">$TextOutFileName</span> =~ <span class="q">/^$ReferenceFileName$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1036 1023       <span class="k">die</span> <span class="q">"Error: Same output, $TextOutFileName, and reference input file names.\nSpecify a different name using \"-r --root\" option or use default name.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1037 1024     <span class="s">}</span>
 | 
| 
 | 
  1038 1025     <span class="k">if</span> <span class="s">(</span><span class="i">$TextOutFileName</span> =~ <span class="q">/^$DatabaseFileName$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1039 1026       <span class="k">die</span> <span class="q">"Error: Same output, $TextOutFileName, and database input file names.\nSpecify a different name using \"-r --root\" option or use default name.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1040 1027     <span class="s">}</span>
 | 
| 
 | 
  1041 1028   <span class="s">}</span>
 | 
| 
 | 
  1042 1029 
 | 
| 
 | 
  1043 1030   <span class="k">if</span> <span class="s">(</span>!<span class="i">$OptionsInfo</span>{<span class="w">OverwriteFiles</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1044 1031     <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">SDOutput</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1045 1032       <span class="k">if</span> <span class="s">(</span><span class="k">-e</span> <span class="i">$SDOutFileName</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1046 1033         <span class="k">die</span> <span class="q">"Error: The output file $SDOutFileName already exists.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1047 1034       <span class="s">}</span>
 | 
| 
 | 
  1048 1035     <span class="s">}</span>
 | 
| 
 | 
  1049 1036     <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">TextOutput</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1050 1037       <span class="k">if</span> <span class="s">(</span><span class="k">-e</span> <span class="i">$TextOutFileName</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1051 1038         <span class="k">die</span> <span class="q">"Error: The output file $TextOutFileName already exists.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1052 1039       <span class="s">}</span>
 | 
| 
 | 
  1053 1040     <span class="s">}</span>
 | 
| 
 | 
  1054 1041   <span class="s">}</span>
 | 
| 
 | 
  1055 1042 
 | 
| 
 | 
  1056 1043   <span class="i">$OutputFilesInfo</span>{<span class="w">OutFileRoot</span>} = <span class="i">$OutFileRoot</span><span class="sc">;</span>
 | 
| 
 | 
  1057 1044   <span class="i">$OutputFilesInfo</span>{<span class="w">SDOutFileName</span>} = <span class="i">$SDOutFileName</span><span class="sc">;</span>
 | 
| 
 | 
  1058 1045   <span class="i">$OutputFilesInfo</span>{<span class="w">TextOutFileName</span>} = <span class="i">$TextOutFileName</span><span class="sc">;</span>
 | 
| 
 | 
  1059 1046 
 | 
| 
 | 
  1060 1047 <span class="s">}</span>
 | 
| 
 | 
  1061 1048 
 | 
| 
 | 
  1062 1049 <span class="c"># Process input fingerprints file names...</span>
 | 
| 
 | 
  1063 1050 <span class="c">#</span>
 | 
| 
 | 
  1064 <a name="ProcessFingerprintsFileNames-"></a>1051 <span class="k">sub </span><span class="m">ProcessFingerprintsFileNames</span> <span class="s">{</span>
 | 
| 
 | 
  1065 1052   <span class="i">@FingerprintsFilesList</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1066 1053 
 | 
| 
 | 
  1067 1054   <span class="k">if</span> <span class="s">(</span><span class="i">@ARGV</span> != <span class="n">2</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1068 1055     <span class="k">die</span> <span class="i">GetUsageFromPod</span><span class="s">(</span><span class="q">"$FindBin::Bin/$ScriptName"</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1069 1056   <span class="s">}</span>
 | 
| 
 | 
  1070 1057 
 | 
| 
 | 
  1071 1058   <span class="c"># Reference fingerprints file name...</span>
 | 
| 
 | 
  1072 1059   <span class="k">push</span> <span class="i">@FingerprintsFilesList</span><span class="cm">,</span> <span class="i">$ARGV</span>[<span class="n">0</span>]<span class="sc">;</span>
 | 
| 
 | 
  1073 1060 
 | 
| 
 | 
  1074 1061   <span class="c"># Database fingerprints file name...</span>
 | 
| 
 | 
  1075 1062   <span class="k">push</span> <span class="i">@FingerprintsFilesList</span><span class="cm">,</span> <span class="i">$ARGV</span>[<span class="n">1</span>]<span class="sc">;</span>
 | 
| 
 | 
  1076 1063 
 | 
| 
 | 
  1077 1064 <span class="s">}</span>
 | 
| 
 | 
  1078 1065 
 | 
| 
 | 
  1079 1066 <span class="c"># Process option values...</span>
 | 
| 
 | 
  1080 <a name="ProcessOptions-"></a>1067 <span class="k">sub </span><span class="m">ProcessOptions</span> <span class="s">{</span>
 | 
| 
 | 
  1081 1068   <span class="i">%OptionsInfo</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1082 1069 
 | 
| 
 | 
  1083 1070   <span class="i">$OptionsInfo</span>{<span class="w">Mode</span>} = <span class="i">$Options</span>{<span class="w">mode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1084 1071   <span class="i">$OptionsInfo</span>{<span class="w">FingerprintsMode</span>} = <span class="i">$Options</span>{<span class="w">fingerprintsmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1085 1072 
 | 
| 
 | 
  1086 1073   <span class="i">$OptionsInfo</span>{<span class="w">SearchMode</span>} = <span class="i">$Options</span>{<span class="w">searchmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1087 1074 
 | 
| 
 | 
  1088 1075   <span class="i">ProcessBitVectorComparisonOptions</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1089 1076   <span class="i">ProcessVectorComparisonOptions</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1090 1077 
 | 
| 
 | 
  1091 1078   <span class="i">$OptionsInfo</span>{<span class="w">GroupFusionRule</span>} = <span class="i">$Options</span>{<span class="w">groupfusionrule</span>}<span class="sc">;</span>
 | 
| 
 | 
  1092 1079   <span class="i">$OptionsInfo</span>{<span class="w">GroupFusionApplyCutoff</span>} = <span class="s">(</span><span class="i">$Options</span>{<span class="w">groupfusionapplycutoff</span>} =~ <span class="q">/^Yes$/i</span><span class="s">)</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span><span class="sc">;</span>
 | 
| 
 | 
  1093 1080 
 | 
| 
 | 
  1094 1081   <span class="i">$OptionsInfo</span>{<span class="w">SimilarCountMode</span>} = <span class="i">$Options</span>{<span class="w">similarcountmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1095 1082   <span class="i">$OptionsInfo</span>{<span class="w">NumOfSimilarMolecules</span>} = <span class="i">$Options</span>{<span class="w">numofsimilarmolecules</span>}<span class="sc">;</span>
 | 
| 
 | 
  1096 1083   <span class="i">$OptionsInfo</span>{<span class="w">PercentSimilarMolecules</span>} = <span class="i">$Options</span>{<span class="w">percentsimilarmolecules</span>}<span class="sc">;</span>
 | 
| 
 | 
  1097 1084 
 | 
| 
 | 
  1098 1085   <span class="c"># Set MaxSimilarMolecules to NumOfSimilarMolecules. For PercentSimilar value of SimilarCountMode,</span>
 | 
| 
 | 
  1099 1086   <span class="c"># it'll be overwritten using number of entries in database fingerprints file and value of PercentSimilarMolecules...</span>
 | 
| 
 | 
  1100 1087   <span class="c">#</span>
 | 
| 
 | 
  1101 1088   <span class="i">$OptionsInfo</span>{<span class="w">MaxSimilarMolecules</span>} = <span class="i">$OptionsInfo</span>{<span class="w">NumOfSimilarMolecules</span>}<span class="sc">;</span>
 | 
| 
 | 
  1102 1089 
 | 
| 
 | 
  1103 1090   <span class="i">$OptionsInfo</span>{<span class="w">SimilarityCutoff</span>} = <span class="i">$Options</span>{<span class="w">similaritycutoff</span>}<span class="sc">;</span>
 | 
| 
 | 
  1104 1091   <span class="i">$OptionsInfo</span>{<span class="w">DistanceCutoff</span>} = <span class="i">$Options</span>{<span class="w">distancecutoff</span>}<span class="sc">;</span>
 | 
| 
 | 
  1105 1092 
 | 
| 
 | 
  1106 1093   <span class="i">$OptionsInfo</span>{<span class="w">kNN</span>} = <span class="i">$Options</span>{<span class="w">knn</span>}<span class="sc">;</span>
 | 
| 
 | 
  1107 1094   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">knn</span>} !~ <span class="q">/^All$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1108 1095     <span class="k">if</span> <span class="s">(</span>!<span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">knn</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1109 1096       <span class="k">die</span> <span class="q">"Error: The value specified, $Options{knn}, for option \"-k, --KNN\" is not valid. Allowed values: > 0 \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1110 1097     <span class="s">}</span>
 | 
| 
 | 
  1111 1098   <span class="s">}</span>
 | 
| 
 | 
  1112 1099 
 | 
| 
 | 
  1113 1100   <span class="i">ProcessReferenceFingerprintsDataOptions</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1114 1101   <span class="i">ProcessDatabaseFingerprintsDataOptions</span><span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1115 1102 
 | 
| 
 | 
  1116 1103   <span class="i">$OptionsInfo</span>{<span class="w">Detail</span>} = <span class="i">$Options</span>{<span class="w">detail</span>}<span class="sc">;</span>
 | 
| 
 | 
  1117 1104 
 | 
| 
 | 
  1118 1105   <span class="i">$OptionsInfo</span>{<span class="w">InDelim</span>} = <span class="i">$Options</span>{<span class="w">indelim</span>}<span class="sc">;</span>
 | 
| 
 | 
  1119 1106   <span class="i">$OptionsInfo</span>{<span class="w">OutDelim</span>} = <span class="s">(</span><span class="i">$Options</span>{<span class="w">outdelim</span>} =~ <span class="q">/tab/i</span> <span class="s">)</span> ? <span class="q">"\t"</span> <span class="co">:</span> <span class="s">(</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">outdelim</span>} =~ <span class="q">/semicolon/i</span><span class="s">)</span> ? <span class="q">"\;"</span> <span class="co">:</span> <span class="q">"\,"</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1120 1107   <span class="i">$OptionsInfo</span>{<span class="w">OutQuote</span>} = <span class="s">(</span><span class="i">$Options</span>{<span class="w">quote</span>} =~ <span class="q">/^Yes$/i</span><span class="s">)</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
  1121 1108 
 | 
| 
 | 
  1122 1109   <span class="i">$OptionsInfo</span>{<span class="w">Output</span>} = <span class="i">$Options</span>{<span class="w">output</span>}<span class="sc">;</span>
 | 
| 
 | 
  1123 1110   <span class="i">$OptionsInfo</span>{<span class="w">SDOutput</span>} = <span class="s">(</span><span class="i">$Options</span>{<span class="w">output</span>} =~ <span class="q">/^(SD|Both)$/i</span><span class="s">)</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
  1124 1111   <span class="i">$OptionsInfo</span>{<span class="w">TextOutput</span>} = <span class="s">(</span><span class="i">$Options</span>{<span class="w">output</span>} =~ <span class="q">/^(Text|Both)$/i</span><span class="s">)</span> ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
  1125 1112 
 | 
| 
 | 
  1126 1113   <span class="i">$OptionsInfo</span>{<span class="w">OverwriteFiles</span>} = <span class="i">$Options</span>{<span class="w">overwrite</span>} ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
  1127 1114   <span class="i">$OptionsInfo</span>{<span class="w">OutFileRoot</span>} = <span class="i">$Options</span>{<span class="w">root</span>} ? <span class="i">$Options</span>{<span class="w">root</span>} <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
  1128 1115 
 | 
| 
 | 
  1129 1116   <span class="i">$OptionsInfo</span>{<span class="w">Fast</span>} = <span class="i">$Options</span>{<span class="w">fast</span>} ? <span class="n">1</span> <span class="co">:</span> <span class="n">0</span><span class="sc">;</span>
 | 
| 
 | 
  1130 1117   <span class="i">$OptionsInfo</span>{<span class="w">ValidateData</span>} = <span class="i">$Options</span>{<span class="w">fast</span>} ? <span class="n">0</span> <span class="co">:</span> <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
  1131 1118 
 | 
| 
 | 
  1132 1119   <span class="i">$OptionsInfo</span>{<span class="w">Precision</span>} = <span class="i">$Options</span>{<span class="w">precision</span>}<span class="sc">;</span>
 | 
| 
 | 
  1133 1120 <span class="s">}</span>
 | 
| 
 | 
  1134 1121 
 | 
| 
 | 
  1135 1122 <span class="c"># Process options related to comparison of bit vector strings...</span>
 | 
| 
 | 
  1136 1123 <span class="c">#</span>
 | 
| 
 | 
  1137 <a name="ProcessBitVectorComparisonOptions-"></a>1124 <span class="k">sub </span><span class="m">ProcessBitVectorComparisonOptions</span> <span class="s">{</span>
 | 
| 
 | 
  1138 1125   <span class="c"># Setup supported bit vector similarity coefficients for bit vector strings...</span>
 | 
| 
 | 
  1139 1126   <span class="k">my</span><span class="s">(</span><span class="i">$ComparisonMeasure</span><span class="cm">,</span> <span class="i">$SupportedComparisonMeasure</span><span class="cm">,</span> <span class="i">@SupportedComparisonMeasures</span><span class="cm">,</span> <span class="i">%SupportedComparisonMeasuresNameMap</span><span class="cm">,</span> <span class="i">%SupportedComparisonMeasuresMethodMap</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1140 1127 
 | 
| 
 | 
  1141 1128   <span class="i">@SupportedComparisonMeasures</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1142 1129   <span class="i">%SupportedComparisonMeasuresNameMap</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1143 1130   <span class="i">%SupportedComparisonMeasuresMethodMap</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1144 1131 
 | 
| 
 | 
  1145 1132   <span class="k">for</span> <span class="i">$SupportedComparisonMeasure</span> <span class="s">(</span><span class="i">Fingerprints::FingerprintsBitVector::GetSupportedSimilarityCoefficients</span><span class="s">(</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1146 1133     <span class="c"># Similarity coefficient function/method names contain "Coefficient" in their names.</span>
 | 
| 
 | 
  1147 1134     <span class="c"># So take 'em out and setup a map to original function/method name...</span>
 | 
| 
 | 
  1148 1135     <span class="i">$ComparisonMeasure</span> = <span class="i">$SupportedComparisonMeasure</span><span class="sc">;</span>
 | 
| 
 | 
  1149 1136     <span class="i">$ComparisonMeasure</span> =~ <span class="q">s/Coefficient$//</span><span class="sc">;</span>
 | 
| 
 | 
  1150 1137 
 | 
| 
 | 
  1151 1138     <span class="k">push</span> <span class="i">@SupportedComparisonMeasures</span><span class="cm">,</span> <span class="i">$ComparisonMeasure</span><span class="sc">;</span>
 | 
| 
 | 
  1152 1139     <span class="i">$SupportedComparisonMeasuresNameMap</span>{<span class="k">lc</span><span class="s">(</span><span class="i">$ComparisonMeasure</span><span class="s">)</span>} = <span class="i">$ComparisonMeasure</span><span class="sc">;</span>
 | 
| 
 | 
  1153 1140     <span class="i">$SupportedComparisonMeasuresMethodMap</span>{<span class="k">lc</span><span class="s">(</span><span class="i">$ComparisonMeasure</span><span class="s">)</span>} = <span class="i">$SupportedComparisonMeasure</span><span class="sc">;</span>
 | 
| 
 | 
  1154 1141   <span class="s">}</span>
 | 
| 
 | 
  1155 1142 
 | 
| 
 | 
  1156 1143   <span class="c"># Setup similarity coefficient to use for calculating similarity matrices for bit vector strings...</span>
 | 
| 
 | 
  1157 1144   <span class="k">my</span><span class="s">(</span><span class="i">$SpecifiedMeasure</span><span class="cm">,</span> <span class="i">$SpecifiedComparisonMeasureName</span><span class="cm">,</span> <span class="i">$SpecifiedComparisonMeasureMethod</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1158 1145 
 | 
| 
 | 
  1159 1146   <span class="i">$SpecifiedComparisonMeasureName</span> = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
  1160 1147   <span class="i">$SpecifiedComparisonMeasureMethod</span> = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
  1161 1148 
 | 
| 
 | 
  1162 1149   <span class="i">$SpecifiedMeasure</span> = <span class="i">$Options</span>{<span class="w">bitvectorcomparisonmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1163 1150 
 | 
| 
 | 
  1164 1151   <span class="k">if</span> <span class="s">(</span>! <span class="k">exists</span> <span class="i">$SupportedComparisonMeasuresMethodMap</span>{<span class="k">lc</span><span class="s">(</span><span class="i">$SpecifiedMeasure</span><span class="s">)</span>} <span class="s">)</span>  <span class="s">{</span>
 | 
| 
 | 
  1165 1152       <span class="k">die</span> <span class="q">"Error: The value specified, $SpecifiedMeasure, for option \"-b --BitVectorComparisonMode\" is not valid.\nAllowed values:"</span><span class="cm">,</span> <span class="i">JoinWords</span><span class="s">(</span>\<span class="i">@SupportedComparisonMeasures</span><span class="cm">,</span> <span class="q">", "</span><span class="cm">,</span> <span class="n">0</span><span class="s">)</span><span class="cm">,</span> <span class="q">"\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1166 1153   <span class="s">}</span>
 | 
| 
 | 
  1167 1154 
 | 
| 
 | 
  1168 1155   <span class="i">$SpecifiedComparisonMeasureMethod</span> = <span class="i">$SupportedComparisonMeasuresMethodMap</span>{<span class="k">lc</span><span class="s">(</span><span class="i">$SpecifiedMeasure</span><span class="s">)</span>}<span class="sc">;</span>
 | 
| 
 | 
  1169 1156   <span class="i">$SpecifiedComparisonMeasureName</span> = <span class="i">$SupportedComparisonMeasuresNameMap</span>{<span class="k">lc</span><span class="s">(</span><span class="i">$SpecifiedMeasure</span><span class="s">)</span>}<span class="sc">;</span>
 | 
| 
 | 
  1170 1157 
 | 
| 
 | 
  1171 1158   <span class="i">$OptionsInfo</span>{<span class="w">BitVectorComparisonMode</span>} = <span class="i">$Options</span>{<span class="w">bitvectorcomparisonmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1172 1159 
 | 
| 
 | 
  1173 1160   <span class="i">$OptionsInfo</span>{<span class="w">SpecifiedBitVectorComparisonMeasure</span>} = <span class="i">$SpecifiedMeasure</span><span class="sc">;</span>
 | 
| 
 | 
  1174 1161   <span class="i">$OptionsInfo</span>{<span class="w">SpecifiedBitVectorComparisonMeasureName</span>} = <span class="i">$SpecifiedComparisonMeasureName</span><span class="sc">;</span>
 | 
| 
 | 
  1175 1162   <span class="i">$OptionsInfo</span>{<span class="w">SpecifiedBitVectorComparisonMeasureMethod</span>} = <span class="i">$SpecifiedComparisonMeasureMethod</span><span class="sc">;</span>
 | 
| 
 | 
  1176 1163 
 | 
| 
 | 
  1177 1164   <span class="c"># Make sure valid alpha parameter is specified for Tversky calculation...</span>
 | 
| 
 | 
  1178 1165   <span class="i">$OptionsInfo</span>{<span class="w">Alpha</span>} = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
  1179 1166   <span class="k">if</span> <span class="s">(</span><span class="i">$SpecifiedMeasure</span> =~ <span class="q">/^(TverskySimilarity|WeightedTverskySimilarity)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1180 1167     <span class="k">if</span> <span class="s">(</span><span class="i">IsEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">alpha</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1181 1168       <span class="k">die</span> <span class="q">"Error: You must specify a value for \"-a, --alpha\" option in \"TverskySimilarity or WeightedTverskySimilarity\" \"-m --mode\". \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1182 1169     <span class="s">}</span>
 | 
| 
 | 
  1183 1170     <span class="k">my</span><span class="s">(</span><span class="i">$Alpha</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1184 1171     <span class="i">$Alpha</span> = <span class="i">$Options</span>{<span class="w">alpha</span>}<span class="sc">;</span>
 | 
| 
 | 
  1185 1172     <span class="k">if</span> <span class="s">(</span>!<span class="s">(</span><span class="i">IsFloat</span><span class="s">(</span><span class="i">$Alpha</span><span class="s">)</span> &amp;&amp; <span class="i">$Alpha</span> &gt;=<span class="n">0</span> &amp;&amp; <span class="i">$Alpha</span> &lt;= <span class="n">1</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1186 1173       <span class="k">die</span> <span class="q">"Error: The value specified, $Options{alpha}, for option \"-a, --alpha\" is not valid. Allowed values: &gt;= 0 and &lt;= 1\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1187 1174     <span class="s">}</span>
 | 
| 
 | 
  1188 1175     <span class="i">$OptionsInfo</span>{<span class="w">Alpha</span>} = <span class="i">$Alpha</span><span class="sc">;</span>
 | 
| 
 | 
  1189 1176   <span class="s">}</span>
 | 
| 
 | 
  1190 1177 
 | 
| 
 | 
  1191 1178   <span class="c"># Make sure valid beta parameter is specified for WeightedTanimoto and WeightedTversky</span>
 | 
| 
 | 
  1192 1179   <span class="c"># calculations...</span>
 | 
| 
 | 
  1193 1180   <span class="i">$OptionsInfo</span>{<span class="w">Beta</span>} = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
  1194 1181   <span class="k">if</span> <span class="s">(</span><span class="i">$SpecifiedMeasure</span> =~ <span class="q">/^(WeightedTverskySimilarity|WeightedTanimotoSimilarity)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1195 1182     <span class="k">if</span> <span class="s">(</span><span class="i">IsEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">beta</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1196 1183       <span class="k">die</span> <span class="q">"Error: You must specify a value for \"-b, --beta\" option in \"WeightedTverskySimilarity or WeightedTanimotoSimilarity\" \"-m --mode\". \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1197 1184     <span class="s">}</span>
 | 
| 
 | 
  1198 1185     <span class="k">my</span><span class="s">(</span><span class="i">$Beta</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1199 1186     <span class="i">$Beta</span> = <span class="i">$Options</span>{<span class="w">beta</span>}<span class="sc">;</span>
 | 
| 
 | 
  1200 1187     <span class="k">if</span> <span class="s">(</span>!<span class="s">(</span><span class="i">IsFloat</span><span class="s">(</span><span class="i">$Beta</span><span class="s">)</span> &amp;&amp; <span class="i">$Beta</span> &gt;=<span class="n">0</span> &amp;&amp; <span class="i">$Beta</span> &lt;= <span class="n">1</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1201 1188       <span class="k">die</span> <span class="q">"Error: The value specified, $Options{beta}, for option \"-b, --beta\" is not valid. Allowed values: &gt;= 0 and &lt;= 1\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1202 1189     <span class="s">}</span>
 | 
| 
 | 
  1203 1190     <span class="i">$OptionsInfo</span>{<span class="w">Beta</span>} = <span class="i">$Beta</span><span class="sc">;</span>
 | 
| 
 | 
  1204 1191   <span class="s">}</span>
 | 
| 
 | 
  1205 1192 <span class="s">}</span>
 | 
| 
 | 
  1206 1193 
 | 
| 
 | 
  1207 1194 <span class="c"># Process options related to comparison of vector strings...</span>
 | 
| 
 | 
  1208 1195 <span class="c">#</span>
 | 
| 
 | 
  1209 <a name="ProcessVectorComparisonOptions-"></a>1196 <span class="k">sub </span><span class="m">ProcessVectorComparisonOptions</span> <span class="s">{</span>
 | 
| 
 | 
  1210 1197   <span class="c"># Setup supported distance and similarity coefficients for vector strings...</span>
 | 
| 
 | 
  1211 1198   <span class="k">my</span><span class="s">(</span><span class="i">$ComparisonMeasure</span><span class="cm">,</span> <span class="i">$SupportedComparisonMeasure</span><span class="cm">,</span> <span class="i">@SupportedComparisonMeasures</span><span class="cm">,</span> <span class="i">%SupportedComparisonMeasuresNameMap</span><span class="cm">,</span> <span class="i">%SupportedComparisonMeasuresMethodMap</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1212 1199 
 | 
| 
 | 
  1213 1200   <span class="i">@SupportedComparisonMeasures</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1214 1201   <span class="i">%SupportedComparisonMeasuresNameMap</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1215 1202   <span class="i">%SupportedComparisonMeasuresMethodMap</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1216 1203   <span class="k">for</span> <span class="i">$SupportedComparisonMeasure</span> <span class="s">(</span><span class="i">Fingerprints::FingerprintsVector::GetSupportedDistanceAndSimilarityCoefficients</span><span class="s">(</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1217 1204     <span class="c"># Similarity and distance coefficient function/method names contain "Coefficient" in their names.</span>
 | 
| 
 | 
  1218 1205     <span class="c"># So take 'em out and setup a map to original function/method name...</span>
 | 
| 
 | 
  1219 1206     <span class="i">$ComparisonMeasure</span> = <span class="i">$SupportedComparisonMeasure</span><span class="sc">;</span>
 | 
| 
 | 
  1220 1207     <span class="k">if</span> <span class="s">(</span><span class="i">$ComparisonMeasure</span> =~ <span class="q">/Coefficient$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1221 1208       <span class="i">$ComparisonMeasure</span> =~ <span class="q">s/Coefficient$//i</span><span class="sc">;</span>
 | 
| 
 | 
  1222 1209     <span class="s">}</span>
 | 
| 
 | 
  1223 1210     <span class="k">push</span> <span class="i">@SupportedComparisonMeasures</span><span class="cm">,</span> <span class="i">$ComparisonMeasure</span><span class="sc">;</span>
 | 
| 
 | 
  1224 1211     <span class="i">$SupportedComparisonMeasuresNameMap</span>{<span class="k">lc</span><span class="s">(</span><span class="i">$ComparisonMeasure</span><span class="s">)</span>} = <span class="i">$ComparisonMeasure</span><span class="sc">;</span>
 | 
| 
 | 
  1225 1212     <span class="i">$SupportedComparisonMeasuresMethodMap</span>{<span class="k">lc</span><span class="s">(</span><span class="i">$ComparisonMeasure</span><span class="s">)</span>} = <span class="i">$SupportedComparisonMeasure</span><span class="sc">;</span>
 | 
| 
 | 
  1226 1213   <span class="s">}</span>
 | 
| 
 | 
  1227 1214 
 | 
| 
 | 
  1228 1215   <span class="c"># Setup the distance or similarity coefficient to use for comparing vector strings...</span>
 | 
| 
 | 
  1229 1216   <span class="k">my</span><span class="s">(</span><span class="i">$SpecifiedMeasure</span><span class="cm">,</span> <span class="i">$SpecifiedComparisonMeasureName</span><span class="cm">,</span> <span class="i">$SpecifiedComparisonMeasureMethod</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1230 1217 
 | 
| 
 | 
  1231 1218   <span class="i">$SpecifiedComparisonMeasureName</span> = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
  1232 1219   <span class="i">$SpecifiedComparisonMeasureMethod</span> = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
  1233 1220 
 | 
| 
 | 
  1234 1221   <span class="i">$SpecifiedMeasure</span> = <span class="i">$Options</span>{<span class="w">vectorcomparisonmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1235 1222   <span class="i">$SpecifiedMeasure</span> =~ <span class="q">s/ //g</span><span class="sc">;</span>
 | 
| 
 | 
  1236 1223 
 | 
| 
 | 
  1237 1224   <span class="k">if</span> <span class="s">(</span>! <span class="k">exists</span><span class="s">(</span><span class="i">$SupportedComparisonMeasuresMethodMap</span>{<span class="k">lc</span><span class="s">(</span><span class="i">$SpecifiedMeasure</span><span class="s">)</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1238 1225     <span class="k">die</span> <span class="q">"Error: The value specified, $SpecifiedMeasure, for option \"-v --VectorComparisonMode\" is not valid.\nAllowed values:"</span><span class="cm">,</span> <span class="i">JoinWords</span><span class="s">(</span>\<span class="i">@SupportedComparisonMeasures</span><span class="cm">,</span> <span class="q">", "</span><span class="cm">,</span> <span class="n">0</span><span class="s">)</span><span class="cm">,</span> <span class="q">"\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1239 1226   <span class="s">}</span>
 | 
| 
 | 
  1240 1227 
 | 
| 
 | 
  1241 1228   <span class="i">$SpecifiedComparisonMeasureMethod</span> = <span class="i">$SupportedComparisonMeasuresMethodMap</span>{<span class="k">lc</span><span class="s">(</span><span class="i">$SpecifiedMeasure</span><span class="s">)</span>}<span class="sc">;</span>
 | 
| 
 | 
  1242 1229   <span class="i">$SpecifiedComparisonMeasureName</span> = <span class="i">$SupportedComparisonMeasuresNameMap</span>{<span class="k">lc</span><span class="s">(</span><span class="i">$SpecifiedMeasure</span><span class="s">)</span>}<span class="sc">;</span>
 | 
| 
 | 
  1243 1230 
 | 
| 
 | 
  1244 1231   <span class="i">$OptionsInfo</span>{<span class="w">VectorComparisonMode</span>} = <span class="i">$Options</span>{<span class="w">vectorcomparisonmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1245 1232 
 | 
| 
 | 
  1246 1233   <span class="i">$OptionsInfo</span>{<span class="w">SpecifiedVectorComparisonMeasure</span>} = <span class="i">$SpecifiedMeasure</span><span class="sc">;</span>
 | 
| 
 | 
  1247 1234   <span class="i">$OptionsInfo</span>{<span class="w">SpecifiedVectorComparisonMeasuresName</span>} = <span class="i">$SpecifiedComparisonMeasureName</span><span class="sc">;</span>
 | 
| 
 | 
  1248 1235   <span class="i">$OptionsInfo</span>{<span class="w">SpecifiedVectorComparisonMeasuresMethod</span>} = <span class="i">$SpecifiedComparisonMeasureMethod</span><span class="sc">;</span>
 | 
| 
 | 
  1249 1236 
 | 
| 
 | 
  1250 1237   <span class="c"># Setup specified vector comparison calculation modes...</span>
 | 
| 
 | 
  1251 1238   <span class="k">my</span><span class="s">(</span><span class="i">$SpecifiedFormulism</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1252 1239 
 | 
| 
 | 
  1253 1240   <span class="i">$SpecifiedFormulism</span> = <span class="i">$Options</span>{<span class="w">vectorcomparisonformulism</span>}<span class="sc">;</span>
 | 
| 
 | 
  1254 1241   <span class="i">$SpecifiedFormulism</span> =~ <span class="q">s/ //g</span><span class="sc">;</span>
 | 
| 
 | 
  1255 1242   <span class="k">if</span> <span class="s">(</span><span class="i">$SpecifiedFormulism</span> !~ <span class="q">/^(AlgebraicForm|BinaryForm|SetTheoreticForm)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1256 1243     <span class="k">die</span> <span class="q">"Error: The value specified, $SpecifiedFormulism, for option \"--VectorComparisonFormulism\" is not valid. Allowed values: AlgebraicForm, BinaryForm or SetTheoreticForm\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1257 1244   <span class="s">}</span>
 | 
| 
 | 
  1258 1245 
 | 
| 
 | 
  1259 1246   <span class="i">$OptionsInfo</span>{<span class="w">VectorComparisonFormulism</span>} = <span class="i">$Options</span>{<span class="w">vectorcomparisonformulism</span>}<span class="sc">;</span>
 | 
| 
 | 
  1260 1247   <span class="i">$OptionsInfo</span>{<span class="w">SpecifiedVectorComparisonMode</span>} = <span class="i">$SpecifiedFormulism</span><span class="sc">;</span>
 | 
| 
 | 
  1261 1248 
 | 
| 
 | 
  1262 1249 <span class="s">}</span>
 | 
| 
 | 
  1263 1250 
 | 
| 
 | 
  1264 1251 <span class="c"># Process options related to data retrieval from reference fingerprints SD and CSV/TSV</span>
 | 
| 
 | 
  1265 1252 <span class="c"># text files...</span>
 | 
| 
 | 
  1266 1253 <span class="c">#</span>
 | 
| 
 | 
  1267 <a name="ProcessReferenceFingerprintsDataOptions-"></a>1254 <span class="k">sub </span><span class="m">ProcessReferenceFingerprintsDataOptions</span> <span class="s">{</span>
 | 
| 
 | 
  1268 1255 
 | 
| 
 | 
  1269 1256   <span class="i">$OptionsInfo</span>{<span class="w">ReferenceCompoundIDPrefix</span>} = <span class="i">$Options</span>{<span class="w">referencecompoundidprefix</span>} ? <span class="i">$Options</span>{<span class="w">referencecompoundidprefix</span>} <span class="co">:</span> <span class="q">'Cmpd'</span><span class="sc">;</span>
 | 
| 
 | 
  1270 1257 
 | 
| 
 | 
  1271 1258   <span class="c"># Compound ID and fingerprints column options for text files...</span>
 | 
| 
 | 
  1272 1259 
 | 
| 
 | 
  1273 1260   <span class="i">$OptionsInfo</span>{<span class="w">ReferenceColMode</span>} = <span class="i">$Options</span>{<span class="w">referencecolmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1274 1261 
 | 
| 
 | 
  1275 1262   <span class="k">if</span> <span class="s">(</span><span class="i">IsNotEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecompoundidcol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1276 1263     <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecolmode</span>} =~ <span class="q">/^ColNum$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1277 1264       <span class="k">if</span> <span class="s">(</span>!<span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecompoundidcol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1278 1265         <span class="k">die</span> <span class="q">"Error: Column value, $Options{referencecompoundidcol}, specified using \"--ReferenceCompoundIDCol\" is not valid: Allowed integer values: &gt; 0\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1279 1266       <span class="s">}</span>
 | 
| 
 | 
  1280 1267     <span class="s">}</span>
 | 
| 
 | 
  1281 1268     <span class="i">$OptionsInfo</span>{<span class="w">ReferenceCompoundIDCol</span>} = <span class="i">$Options</span>{<span class="w">referencecompoundidcol</span>}<span class="sc">;</span>
 | 
| 
 | 
  1282 1269   <span class="s">}</span>
 | 
| 
 | 
  1283 1270   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
  1284 1271     <span class="i">$OptionsInfo</span>{<span class="w">ReferenceCompoundIDCol</span>} = <span class="q">'AutoDetect'</span><span class="sc">;</span>
 | 
| 
 | 
  1285 1272   <span class="s">}</span>
 | 
| 
 | 
  1286 1273 
 | 
| 
 | 
  1287 1274   <span class="k">if</span> <span class="s">(</span><span class="i">IsNotEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencefingerprintscol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1288 1275     <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecolmode</span>} =~ <span class="q">/^ColNum$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1289 1276       <span class="k">if</span> <span class="s">(</span>!<span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencefingerprintscol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1290 1277         <span class="k">die</span> <span class="q">"Error: Column value, $Options{referencefingerprintscol}, specified using \"--ReferenceFingerprintsCol\" is not valid: Allowed integer values: &gt; 0\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1291 1278       <span class="s">}</span>
 | 
| 
 | 
  1292 1279     <span class="s">}</span>
 | 
| 
 | 
  1293 1280     <span class="i">$OptionsInfo</span>{<span class="w">ReferenceFingerprintsCol</span>} = <span class="i">$Options</span>{<span class="w">referencefingerprintscol</span>}<span class="sc">;</span>
 | 
| 
 | 
  1294 1281   <span class="s">}</span>
 | 
| 
 | 
  1295 1282   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
  1296 1283     <span class="i">$OptionsInfo</span>{<span class="w">ReferenceFingerprintsCol</span>} = <span class="q">'AutoDetect'</span><span class="sc">;</span>
 | 
| 
 | 
  1297 1284   <span class="s">}</span>
 | 
| 
 | 
  1298 1285 
 | 
| 
 | 
  1299 1286   <span class="k">if</span> <span class="s">(</span><span class="i">IsNotEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecompoundidcol</span>}<span class="s">)</span> && <span class="i">IsNotEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencefingerprintscol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1300 1287     <span class="k">if</span> <span class="s">(</span><span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecompoundidcol</span>}<span class="s">)</span> && <span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencefingerprintscol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1301 1288       <span class="k">if</span> <span class="s">(</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecompoundidcol</span>} == <span class="i">$Options</span>{<span class="w">referencefingerprintscol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1302 1289         <span class="k">die</span> <span class="q">"Error: Values specified using \"--ReferenceCompoundIDCol\" and \"--ReferenceFingerprintsCol\", $Options{referencecompoundidcol}, must be different.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1303 1290       <span class="s">}</span>
 | 
| 
 | 
  1304 1291     <span class="s">}</span>
 | 
| 
 | 
  1305 1292     <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
  1306 1293       <span class="k">if</span> <span class="s">(</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecompoundidcol</span>} <span class="k">eq</span> <span class="i">$Options</span>{<span class="w">referencefingerprintscol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1307 1294         <span class="k">die</span> <span class="q">"Error: Values specified using \"--ReferenceCompoundIDCol\" and \"--ReferenceFingerprintsCol\", $Options{referencecompoundidcol}, must be different.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1308 1295       <span class="s">}</span>
 | 
| 
 | 
  1309 1296     <span class="s">}</span>
 | 
| 
 | 
  1310 1297   <span class="s">}</span>
 | 
| 
 | 
  1311 1298 
 | 
| 
 | 
  1312 1299   <span class="c"># Compound ID and fingerprints field options for SD files...</span>
 | 
| 
 | 
  1313 1300 
 | 
| 
 | 
  1314 1301   <span class="i">$OptionsInfo</span>{<span class="w">ReferenceCompoundIDMode</span>} = <span class="i">$Options</span>{<span class="w">referencecompoundidmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1315 1302   <span class="i">$OptionsInfo</span>{<span class="w">ReferenceCompoundIDField</span>} = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
  1316 1303 
 | 
| 
 | 
  1317 1304   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecompoundidmode</span>} =~ <span class="q">/^DataField$/i</span> && !<span class="i">$Options</span>{<span class="w">referencecompoundidfield</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1318 1305     <span class="k">die</span> <span class="q">"Error: You must specify a value for \"--ReferenceCompoundIDField\" option in \"DataField\" \"--ReferenceCompoundIDMode\". \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1319 1306   <span class="s">}</span>
 | 
| 
 | 
  1320 1307   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecompoundidfield</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1321 1308     <span class="i">$OptionsInfo</span>{<span class="w">ReferenceCompoundIDField</span>} = <span class="i">$Options</span>{<span class="w">referencecompoundidfield</span>}<span class="sc">;</span>
 | 
| 
 | 
  1322 1309   <span class="s">}</span>
 | 
| 
 | 
  1323 1310 
 | 
| 
 | 
  1324 1311   <span class="k">if</span> <span class="s">(</span><span class="i">IsNotEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencefingerprintsfield</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1325 1312     <span class="i">$OptionsInfo</span>{<span class="w">ReferenceFingerprintsField</span>} = <span class="i">$Options</span>{<span class="w">referencefingerprintsfield</span>}<span class="sc">;</span>
 | 
| 
 | 
  1326 1313   <span class="s">}</span>
 | 
| 
 | 
  1327 1314   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
  1328 1315     <span class="i">$OptionsInfo</span>{<span class="w">ReferenceFingerprintsField</span>} = <span class="q">'AutoDetect'</span><span class="sc">;</span>
 | 
| 
 | 
  1329 1316   <span class="s">}</span>
 | 
| 
 | 
  1330 1317 
 | 
| 
 | 
  1331 1318   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecompoundidfield</span>} && <span class="i">IsNotEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencefingerprintsfield</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1332 1319     <span class="k">if</span> <span class="s">(</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecompoundidfield</span>} <span class="k">eq</span> <span class="i">$Options</span>{<span class="w">referencefingerprintsfield</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1333 1320       <span class="k">die</span> <span class="q">"Error: Values specified using \"--ReferenceCompoundIDField\" and \"--ReferenceFingerprintsfield\", $Options{referencecompoundidfield}, must be different.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1334 1321     <span class="s">}</span>
 | 
| 
 | 
  1335 1322   <span class="s">}</span>
 | 
| 
 | 
  1336 1323 
 | 
| 
 | 
  1337 1324 <span class="s">}</span>
 | 
| 
 | 
  1338 1325 
 | 
| 
 | 
  1339 1326 <span class="c"># Process options related to data retrieval from database fingerprints SD and CSV/TSV</span>
 | 
| 
 | 
  1340 1327 <span class="c"># text files...</span>
 | 
| 
 | 
  1341 1328 <span class="c">#</span>
 | 
| 
 | 
  1342 <a name="ProcessDatabaseFingerprintsDataOptions-"></a>1329 <span class="k">sub </span><span class="m">ProcessDatabaseFingerprintsDataOptions</span> <span class="s">{</span>
 | 
| 
 | 
  1343 1330 
 | 
| 
 | 
  1344 1331   <span class="i">$OptionsInfo</span>{<span class="w">DatabaseCompoundIDPrefix</span>} = <span class="i">$Options</span>{<span class="w">databasecompoundidprefix</span>} ? <span class="i">$Options</span>{<span class="w">databasecompoundidprefix</span>} <span class="co">:</span> <span class="q">'Cmpd'</span><span class="sc">;</span>
 | 
| 
 | 
  1345 1332 
 | 
| 
 | 
  1346 1333   <span class="c"># Compound ID and fingerprints column options for text files...</span>
 | 
| 
 | 
  1347 1334 
 | 
| 
 | 
  1348 1335   <span class="i">$OptionsInfo</span>{<span class="w">DatabaseColMode</span>} = <span class="i">$Options</span>{<span class="w">databasecolmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1349 1336 
 | 
| 
 | 
  1350 1337   <span class="k">if</span> <span class="s">(</span><span class="i">IsNotEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecompoundidcol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1351 1338     <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecolmode</span>} =~ <span class="q">/^ColNum$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1352 1339       <span class="k">if</span> <span class="s">(</span>!<span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecompoundidcol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1353 1340         <span class="k">die</span> <span class="q">"Error: Column value, $Options{databasecompoundidcol}, specified using \"--DatabaseCompoundIDCol\" is not valid: Allowed integer values: &gt; 0\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1354 1341       <span class="s">}</span>
 | 
| 
 | 
  1355 1342     <span class="s">}</span>
 | 
| 
 | 
  1356 1343     <span class="i">$OptionsInfo</span>{<span class="w">DatabaseCompoundIDCol</span>} = <span class="i">$Options</span>{<span class="w">databasecompoundidcol</span>}<span class="sc">;</span>
 | 
| 
 | 
  1357 1344   <span class="s">}</span>
 | 
| 
 | 
  1358 1345   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
  1359 1346     <span class="i">$OptionsInfo</span>{<span class="w">DatabaseCompoundIDCol</span>} = <span class="q">'AutoDetect'</span><span class="sc">;</span>
 | 
| 
 | 
  1360 1347   <span class="s">}</span>
 | 
| 
 | 
  1361 1348 
 | 
| 
 | 
  1362 1349   <span class="k">if</span> <span class="s">(</span><span class="i">IsNotEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasefingerprintscol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1363 1350     <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecolmode</span>} =~ <span class="q">/^ColNum$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1364 1351       <span class="k">if</span> <span class="s">(</span>!<span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasefingerprintscol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1365 1352         <span class="k">die</span> <span class="q">"Error: Column value, $Options{databasefingerprintscol}, specified using \"--DatabaseFingerprintsCol\" is not valid: Allowed integer values: &gt; 0\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1366 1353       <span class="s">}</span>
 | 
| 
 | 
  1367 1354     <span class="s">}</span>
 | 
| 
 | 
  1368 1355     <span class="i">$OptionsInfo</span>{<span class="w">DatabaseFingerprintsCol</span>} = <span class="i">$Options</span>{<span class="w">databasefingerprintscol</span>}<span class="sc">;</span>
 | 
| 
 | 
  1369 1356   <span class="s">}</span>
 | 
| 
 | 
  1370 1357   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
  1371 1358     <span class="i">$OptionsInfo</span>{<span class="w">DatabaseFingerprintsCol</span>} = <span class="q">'AutoDetect'</span><span class="sc">;</span>
 | 
| 
 | 
  1372 1359   <span class="s">}</span>
 | 
| 
 | 
  1373 1360 
 | 
| 
 | 
  1374 1361   <span class="k">if</span> <span class="s">(</span><span class="i">IsNotEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecompoundidcol</span>}<span class="s">)</span> && <span class="i">IsNotEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasefingerprintscol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1375 1362     <span class="k">if</span> <span class="s">(</span><span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecompoundidcol</span>}<span class="s">)</span> && <span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasefingerprintscol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1376 1363       <span class="k">if</span> <span class="s">(</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecompoundidcol</span>} == <span class="i">$Options</span>{<span class="w">databasefingerprintscol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1377 1364         <span class="k">die</span> <span class="q">"Error: Values specified using \"--DatabaseCompoundIDCol\" and \"--DatabaseFingerprintsCol\", $Options{databasecompoundidcol}, must be different.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1378 1365       <span class="s">}</span>
 | 
| 
 | 
  1379 1366     <span class="s">}</span>
 | 
| 
 | 
  1380 1367     <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
  1381 1368       <span class="k">if</span> <span class="s">(</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecompoundidcol</span>} <span class="k">eq</span> <span class="i">$Options</span>{<span class="w">databasefingerprintscol</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1382 1369         <span class="k">die</span> <span class="q">"Error: Values specified using \"--DatabaseCompoundIDCol\" and \"--DatabaseFingerprintsCol\", $Options{databasecompoundidcol}, must be different.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1383 1370       <span class="s">}</span>
 | 
| 
 | 
  1384 1371     <span class="s">}</span>
 | 
| 
 | 
  1385 1372   <span class="s">}</span>
 | 
| 
 | 
  1386 1373 
 | 
| 
 | 
  1387 1374   <span class="c"># Database data column options for text files...</span>
 | 
| 
 | 
  1388 1375 
 | 
| 
 | 
  1389 1376   <span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataColsMode</span>} = <span class="i">$Options</span>{<span class="w">databasedatacolsmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1390 1377   <span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataCols</span>} = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
  1391 1378   <span class="i">@</span>{<span class="i">$OptionsInfo</span>{<span class="w">SpecifiedDatabaseDataCols</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1392 1379 
 | 
| 
 | 
  1393 1380   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasedatacolsmode</span>} =~ <span class="q">/^Specify$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1394 1381     <span class="k">my</span><span class="s">(</span><span class="i">$DatabaseDataCols</span><span class="cm">,</span> <span class="i">$DatabaseColNum</span><span class="cm">,</span> <span class="i">@SpecifiedDataCols</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1395 1382 
 | 
| 
 | 
  1396 1383     <span class="k">if</span> <span class="s">(</span>!<span class="i">$Options</span>{<span class="w">databasedatacols</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1397 1384       <span class="k">die</span> <span class="q">"Error: You must specify a value for \"--DatabaseDataCols\" option in \"Specify\" \"--DatabaseDataColsMode\". \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1398 1385     <span class="s">}</span>
 | 
| 
 | 
  1399 1386     <span class="i">$DatabaseDataCols</span> = <span class="i">$Options</span>{<span class="w">databasedatacols</span>}<span class="sc">;</span>
 | 
| 
 | 
  1400 1387 
 | 
| 
 | 
  1401 1388     <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecolmode</span>} =~ <span class="q">/^ColNum$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1402 1389       <span class="i">$DatabaseDataCols</span> =~ <span class="q">s/ //g</span><span class="sc">;</span>
 | 
| 
 | 
  1403 1390       <span class="i">@SpecifiedDataCols</span> = <span class="k">split</span> <span class="q">/\,/</span><span class="cm">,</span> <span class="i">$DatabaseDataCols</span><span class="sc">;</span>
 | 
| 
 | 
  1404 1391       <span class="k">for</span> <span class="i">$DatabaseColNum</span> <span class="s">(</span><span class="i">@SpecifiedDataCols</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1405 1392         <span class="k">if</span> <span class="s">(</span>!<span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$DatabaseColNum</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1406 1393           <span class="k">die</span> <span class="q">"Error: Column value, $DatabaseColNum, specified using \"--DatabaseDataCols\" is not valid: Allowed integer values: &gt; 0\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1407 1394         <span class="s">}</span>
 | 
| 
 | 
  1408 1395       <span class="s">}</span>
 | 
| 
 | 
  1409 1396     <span class="s">}</span>
 | 
| 
 | 
  1410 1397     <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
  1411 1398       <span class="i">@SpecifiedDataCols</span> = <span class="k">split</span> <span class="q">/\,/</span><span class="cm">,</span> <span class="i">$DatabaseDataCols</span><span class="sc">;</span>
 | 
| 
 | 
  1412 1399     <span class="s">}</span>
 | 
| 
 | 
  1413 1400     <span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataCols</span>} = <span class="i">$DatabaseDataCols</span><span class="sc">;</span>
 | 
| 
 | 
  1414 1401     <span class="k">push</span> <span class="i">@</span>{<span class="i">$OptionsInfo</span>{<span class="w">SpecifiedDatabaseDataCols</span>}}<span class="cm">,</span> <span class="i">@SpecifiedDataCols</span><span class="sc">;</span>
 | 
| 
 | 
  1415 1402   <span class="s">}</span>
 | 
| 
 | 
  1416 1403   <span class="k">elsif</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasedatacolsmode</span>} =~ <span class="q">/^All$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1417 1404     <span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataCols</span>} = <span class="q">'All'</span><span class="sc">;</span>
 | 
| 
 | 
  1418 1405   <span class="s">}</span>
 | 
| 
 | 
  1419 1406 
 | 
| 
 | 
  1420 1407   <span class="k">if</span> <span class="s">(</span><span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataColsMode</span>} =~ <span class="q">/^Specify$/i</span> && !<span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataCols</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1421 1408     <span class="k">die</span> <span class="q">"Error: You must specify a value for \"--DatabaseDataCols\" option in \"Specify\" \"--DatabaseDataColsMode\". \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1422 1409   <span class="s">}</span>
 | 
| 
 | 
  1423 1410 
 | 
| 
 | 
  1424 1411   <span class="c"># Compound ID and fingerprints field options for SD files...</span>
 | 
| 
 | 
  1425 1412 
 | 
| 
 | 
  1426 1413   <span class="i">$OptionsInfo</span>{<span class="w">DatabaseCompoundIDMode</span>} = <span class="i">$Options</span>{<span class="w">databasecompoundidmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1427 1414   <span class="i">$OptionsInfo</span>{<span class="w">DatabaseCompoundIDField</span>} = <span class="i">$Options</span>{<span class="w">databasecompoundidfield</span>} ? <span class="i">$Options</span>{<span class="w">databasecompoundidfield</span>} <span class="co">:</span> <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
  1428 1415 
 | 
| 
 | 
  1429 1416   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecompoundidmode</span>} =~ <span class="q">/^DataField$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1430 1417     <span class="k">if</span> <span class="s">(</span>!<span class="i">$Options</span>{<span class="w">databasecompoundidfield</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1431 1418       <span class="k">die</span> <span class="q">"Error: You must specify a value for \"--DatabaseCompoundIDField\" option in \"DataField\" \"--DatabaseCompoundIDMode\". \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1432 1419     <span class="s">}</span>
 | 
| 
 | 
  1433 1420     <span class="i">$OptionsInfo</span>{<span class="w">DatabaseCompoundIDField</span>} = <span class="i">$Options</span>{<span class="w">databasecompoundidfield</span>}<span class="sc">;</span>
 | 
| 
 | 
  1434 1421   <span class="s">}</span>
 | 
| 
 | 
  1435 1422 
 | 
| 
 | 
  1436 1423 
 | 
| 
 | 
  1437 1424   <span class="k">if</span> <span class="s">(</span><span class="i">IsNotEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasefingerprintsfield</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1438 1425     <span class="i">$OptionsInfo</span>{<span class="w">DatabaseFingerprintsField</span>} = <span class="i">$Options</span>{<span class="w">databasefingerprintsfield</span>}<span class="sc">;</span>
 | 
| 
 | 
  1439 1426   <span class="s">}</span>
 | 
| 
 | 
  1440 1427   <span class="k">else</span> <span class="s">{</span>
 | 
| 
 | 
  1441 1428     <span class="i">$OptionsInfo</span>{<span class="w">DatabaseFingerprintsField</span>} = <span class="q">'AutoDetect'</span><span class="sc">;</span>
 | 
| 
 | 
  1442 1429   <span class="s">}</span>
 | 
| 
 | 
  1443 1430 
 | 
| 
 | 
  1444 1431   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecompoundidfield</span>} && <span class="i">IsNotEmpty</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasefingerprintsfield</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1445 1432     <span class="k">if</span> <span class="s">(</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecompoundidfield</span>} <span class="k">eq</span> <span class="i">$Options</span>{<span class="w">databasefingerprintsfield</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1446 1433       <span class="k">die</span> <span class="q">"Error: Values specified using \"--DatabaseCompoundIDField\" and \"--DatabaseFingerprintsfield\", $Options{databasecompoundidfield}, must be different.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1447 1434     <span class="s">}</span>
 | 
| 
 | 
  1448 1435   <span class="s">}</span>
 | 
| 
 | 
  1449 1436 
 | 
| 
 | 
  1450 1437   <span class="c"># Database data field options for SD files...</span>
 | 
| 
 | 
  1451 1438 
 | 
| 
 | 
  1452 1439   <span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataFieldsMode</span>} = <span class="i">$Options</span>{<span class="w">databasedatafieldsmode</span>}<span class="sc">;</span>
 | 
| 
 | 
  1453 1440   <span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataFields</span>} = <span class="q">''</span><span class="sc">;</span>
 | 
| 
 | 
  1454 1441   <span class="i">@</span>{<span class="i">$OptionsInfo</span>{<span class="w">SpecifiedDatabaseDataFields</span>}} = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1455 1442 
 | 
| 
 | 
  1456 1443   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasedatafieldsmode</span>} =~ <span class="q">/^Specify$/i</span> && !<span class="i">$Options</span>{<span class="w">databasedatafields</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1457 1444     <span class="k">die</span> <span class="q">"Error: You must specify a value for \"--DatabaseDataFields\" option in \"Specify\" \"--DatabaseDataFieldsMode\". \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1458 1445   <span class="s">}</span>
 | 
| 
 | 
  1459 1446   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasedatafields</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1460 1447     <span class="k">my</span><span class="s">(</span><span class="i">@SpecifiedDataFields</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1461 1448     <span class="i">$OptionsInfo</span>{<span class="w">DatabaseDataFields</span>} = <span class="i">$Options</span>{<span class="w">databasedatafields</span>}<span class="sc">;</span>
 | 
| 
 | 
  1462 1449 
 | 
| 
 | 
  1463 1450     <span class="i">@SpecifiedDataFields</span> = <span class="k">split</span> <span class="q">/\,/</span><span class="cm">,</span> <span class="i">$Options</span>{<span class="w">databasedatafields</span>}<span class="sc">;</span>
 | 
| 
 | 
  1464 1451     <span class="k">push</span> <span class="i">@</span>{<span class="i">$OptionsInfo</span>{<span class="w">SpecifiedDatabaseDataFields</span>}}<span class="cm">,</span> <span class="i">@SpecifiedDataFields</span><span class="sc">;</span>
 | 
| 
 | 
  1465 1452   <span class="s">}</span>
 | 
| 
 | 
  1466 1453 <span class="s">}</span>
 | 
| 
 | 
  1467 1454 
 | 
| 
 | 
  1468 1455 <span class="c"># Setup script usage and retrieve command line arguments specified using various options...</span>
 | 
| 
 | 
  1469 <a name="SetupScriptUsage-"></a>1456 <span class="k">sub </span><span class="m">SetupScriptUsage</span> <span class="s">{</span>
 | 
| 
 | 
  1470 1457 
 | 
| 
 | 
  1471 1458   <span class="c"># Retrieve all the options...</span>
 | 
| 
 | 
  1472 1459   <span class="i">%Options</span> = <span class="s">(</span><span class="s">)</span><span class="sc">;</span>
 | 
| 
 | 
  1473 1460 
 | 
| 
 | 
  1474 1461   <span class="i">$Options</span>{<span class="w">alpha</span>} = <span class="n">0.5</span><span class="sc">;</span>
 | 
| 
 | 
  1475 1462   <span class="i">$Options</span>{<span class="w">beta</span>} = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
  1476 1463 
 | 
| 
 | 
  1477 1464   <span class="i">$Options</span>{<span class="w">bitvectorcomparisonmode</span>} = <span class="q">"TanimotoSimilarity"</span><span class="sc">;</span>
 | 
| 
 | 
  1478 1465 
 | 
| 
 | 
  1479 1466   <span class="i">$Options</span>{<span class="w">databasecolmode</span>} = <span class="q">'colnum'</span><span class="sc">;</span>
 | 
| 
 | 
  1480 1467 
 | 
| 
 | 
  1481 1468   <span class="i">$Options</span>{<span class="w">databasecompoundidprefix</span>} = <span class="q">'Cmpd'</span><span class="sc">;</span>
 | 
| 
 | 
  1482 1469   <span class="i">$Options</span>{<span class="w">databasecompoundidmode</span>} = <span class="q">'LabelPrefix'</span><span class="sc">;</span>
 | 
| 
 | 
  1483 1470 
 | 
| 
 | 
  1484 1471   <span class="i">$Options</span>{<span class="w">databasedatacolsmode</span>} = <span class="q">'CompoundID'</span><span class="sc">;</span>
 | 
| 
 | 
  1485 1472   <span class="i">$Options</span>{<span class="w">databasedatafieldsmode</span>} = <span class="q">'CompoundID'</span><span class="sc">;</span>
 | 
| 
 | 
  1486 1473 
 | 
| 
 | 
  1487 1474   <span class="i">$Options</span>{<span class="w">distancecutoff</span>} = <span class="n">10</span><span class="sc">;</span>
 | 
| 
 | 
  1488 1475 
 | 
| 
 | 
  1489 1476   <span class="i">$Options</span>{<span class="w">referencecolmode</span>} = <span class="q">'colnum'</span><span class="sc">;</span>
 | 
| 
 | 
  1490 1477 
 | 
| 
 | 
  1491 1478   <span class="i">$Options</span>{<span class="w">referencecompoundidprefix</span>} = <span class="q">'Cmpd'</span><span class="sc">;</span>
 | 
| 
 | 
  1492 1479   <span class="i">$Options</span>{<span class="w">referencecompoundidmode</span>} = <span class="q">'LabelPrefix'</span><span class="sc">;</span>
 | 
| 
 | 
  1493 1480 
 | 
| 
 | 
  1494 1481   <span class="i">$Options</span>{<span class="w">detail</span>} = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
  1495 1482 
 | 
| 
 | 
  1496 1483   <span class="i">$Options</span>{<span class="w">fingerprintsmode</span>} = <span class="q">'AutoDetect'</span><span class="sc">;</span>
 | 
| 
 | 
  1497 1484   <span class="i">$Options</span>{<span class="w">groupfusionrule</span>} = <span class="q">'Max'</span><span class="sc">;</span>
 | 
| 
 | 
  1498 1485   <span class="i">$Options</span>{<span class="w">groupfusionapplycutoff</span>} = <span class="q">'Yes'</span><span class="sc">;</span>
 | 
| 
 | 
  1499 1486 
 | 
| 
 | 
  1500 1487   <span class="i">$Options</span>{<span class="w">knn</span>} = <span class="q">'All'</span><span class="sc">;</span>
 | 
| 
 | 
  1501 1488 
 | 
| 
 | 
  1502 1489   <span class="i">$Options</span>{<span class="w">mode</span>} = <span class="q">'MultipleReferences'</span><span class="sc">;</span>
 | 
| 
 | 
  1503 1490 
 | 
| 
 | 
  1504 1491   <span class="i">$Options</span>{<span class="w">numofsimilarmolecules</span>} = <span class="n">10</span><span class="sc">;</span>
 | 
| 
 | 
  1505 1492   <span class="i">$Options</span>{<span class="w">percentsimilarmolecules</span>} = <span class="n">1</span><span class="sc">;</span>
 | 
| 
 | 
  1506 1493 
 | 
| 
 | 
  1507 1494   <span class="i">$Options</span>{<span class="w">indelim</span>} = <span class="q">'comma'</span><span class="sc">;</span>
 | 
| 
 | 
  1508 1495   <span class="i">$Options</span>{<span class="w">outdelim</span>} = <span class="q">'comma'</span><span class="sc">;</span>
 | 
| 
 | 
  1509 1496   <span class="i">$Options</span>{<span class="w">quote</span>} = <span class="q">'yes'</span><span class="sc">;</span>
 | 
| 
 | 
  1510 1497 
 | 
| 
 | 
  1511 1498   <span class="i">$Options</span>{<span class="w">output</span>} = <span class="q">'text'</span><span class="sc">;</span>
 | 
| 
 | 
  1512 1499 
 | 
| 
 | 
  1513 1500   <span class="i">$Options</span>{<span class="w">precision</span>} = <span class="n">2</span><span class="sc">;</span>
 | 
| 
 | 
  1514 1501 
 | 
| 
 | 
  1515 1502   <span class="i">$Options</span>{<span class="w">searchmode</span>} = <span class="q">'SimilaritySearch'</span><span class="sc">;</span>
 | 
| 
 | 
  1516 1503 
 | 
| 
 | 
  1517 1504   <span class="i">$Options</span>{<span class="w">similarcountmode</span>} = <span class="q">'NumOfSimilar'</span><span class="sc">;</span>
 | 
| 
 | 
  1518 1505 
 | 
| 
 | 
  1519 1506   <span class="i">$Options</span>{<span class="w">similaritycutoff</span>} = <span class="n">0.75</span><span class="sc">;</span>
 | 
| 
 | 
  1520 1507 
 | 
| 
 | 
  1521 1508   <span class="i">$Options</span>{<span class="w">vectorcomparisonmode</span>} = <span class="q">'TanimotoSimilarity'</span><span class="sc">;</span>
 | 
| 
 | 
  1522 1509   <span class="i">$Options</span>{<span class="w">vectorcomparisonformulism</span>} = <span class="q">'AlgebraicForm'</span><span class="sc">;</span>
 | 
| 
 | 
  1523 1510 
 | 
| 
 | 
  1524 1511   <span class="k">if</span> <span class="s">(</span>!<span class="i">GetOptions</span><span class="s">(</span>\<span class="i">%Options</span><span class="cm">,</span> <span class="q">"alpha=f"</span><span class="cm">,</span> <span class="q">"beta=f"</span><span class="cm">,</span> <span class="q">"bitvectorcomparisonmode|b=s"</span><span class="cm">,</span> <span class="q">"databasecolmode=s"</span><span class="cm">,</span> <span class="q">"databasecompoundidcol=s"</span><span class="cm">,</span> <span class="q">"databasecompoundidprefix=s"</span><span class="cm">,</span> <span class="q">"databasecompoundidfield=s"</span><span class="cm">,</span> <span class="q">"databasecompoundidmode=s"</span><span class="cm">,</span> <span class="q">"databasedatacols=s"</span><span class="cm">,</span> <span class="q">"databasedatacolsmode=s"</span><span class="cm">,</span> <span class="q">"databasedatafields=s"</span><span class="cm">,</span> <span class="q">"databasedatafieldsmode=s"</span><span class="cm">,</span> <span class="q">"databasefingerprintscol=s"</span><span class="cm">,</span> <span class="q">"databasefingerprintsfield=s"</span><span class="cm">,</span> <span class="q">"distancecutoff=f"</span><span class="cm">,</span> <span class="q">"detail|d=i"</span><span class="cm">,</span> <span class="q">"fast|f"</span><span class="cm">,</span> <span class="q">"fingerprintsmode=s"</span><span class="cm">,</span> <span class="q">"groupfusionrule|g=s"</span><span class="cm">,</span> <span class="cm">,</span> <span class="q">"groupfusionapplycutoff=s"</span><span class="cm">,</span> <span class="q">"help|h"</span><span class="cm">,</span> <span class="q">"indelim=s"</span><span class="cm">,</span> <span class="q">"knn|k=s"</span><span class="cm">,</span> <span class="q">"mode|m=s"</span><span class="cm">,</span> <span class="q">"numofsimilarmolecules|n=i"</span><span class="cm">,</span> <span class="q">"outdelim=s"</span><span class="cm">,</span> <span 
class="q">"output=s"</span><span class="cm">,</span> <span class="q">"overwrite|o"</span><span class="cm">,</span> <span class="q">"percentsimilarmolecules|p=f"</span><span class="cm">,</span> <span class="q">"precision=s"</span><span class="cm">,</span> <span class="q">"quote|q=s"</span><span class="cm">,</span> <span class="q">"referencecolmode=s"</span><span class="cm">,</span> <span class="q">"referencecompoundidcol=s"</span><span class="cm">,</span> <span class="q">"referencecompoundidprefix=s"</span><span class="cm">,</span> <span class="q">"referencecompoundidfield=s"</span><span class="cm">,</span> <span class="q">"referencecompoundidmode=s"</span><span class="cm">,</span> <span class="q">"referencefingerprintscol=s"</span><span class="cm">,</span> <span class="q">"referencefingerprintsfield=s"</span><span class="cm">,</span> <span class="q">"root|r=s"</span><span class="cm">,</span> <span class="q">"searchmode|s=s"</span><span class="cm">,</span> <span class="q">"similarcountmode=s"</span><span class="cm">,</span> <span class="q">"similaritycutoff=f"</span><span class="cm">,</span> <span class="q">"vectorcomparisonmode|v=s"</span><span class="cm">,</span> <span class="q">"vectorcomparisonformulism=s"</span><span class="cm">,</span> <span class="q">"workingdir|w=s"</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1525 1512     <span class="k">die</span> <span class="q">"\nTo get a list of valid options and their values, use \"$ScriptName -h\" or\n\"perl -S $ScriptName -h\" command and try again...\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1526 1513   <span class="s">}</span>
 | 
| 
 | 
  1527 1514   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">workingdir</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1528 1515     <span class="k">if</span> <span class="s">(</span>! <span class="k">-d</span> <span class="i">$Options</span>{<span class="w">workingdir</span>}<span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1529 1516       <span class="k">die</span> <span class="q">"Error: The value specified, $Options{workingdir}, for option \"-w --workingdir\" is not a directory name.\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1530 1517     <span class="s">}</span>
 | 
| 
 | 
  1531 1518     <span class="k">chdir</span> <span class="i">$Options</span>{<span class="w">workingdir</span>} <span class="k">or</span> <span class="k">die</span> <span class="q">"Error: Couldn't chdir $Options{workingdir}: $! \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1532 1519   <span class="s">}</span>
 | 
| 
 | 
  1533 1520   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecolmode</span>} !~ <span class="q">/^(ColNum|ColLabel)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1534 1521     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{databasecolmode}, for option \"--DatabaseColMode\" is not valid. Allowed values: ColNum, or ColLabel\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1535 1522   <span class="s">}</span>
 | 
| 
 | 
  1536 1523   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasecompoundidmode</span>} !~ <span class="q">/^(DataField|MolName|LabelPrefix|MolNameOrLabelPrefix)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1537 1524     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{databasecompoundidmode}, for option \"--DatabaseCompoundIDMode\" is not valid. Allowed values: DataField, MolName, LabelPrefix or MolNameOrLabelPrefix\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1538 1525   <span class="s">}</span>
 | 
| 
 | 
  1539 1526   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasedatacolsmode</span>} !~ <span class="q">/^(All|Specify|CompoundID)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1540 1527     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{databasedatacolsmode}, for option \"--DatabaseDataColsMode\" is not valid. Allowed values: All, Specify, or CompoundID\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1541 1528   <span class="s">}</span>
 | 
| 
 | 
  1542 1529   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">databasedatafieldsmode</span>} !~ <span class="q">/^(All|Common|Specify|CompoundID)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1543 1530     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{databasedatafieldsmode}, for option \"--DatabaseDataFieldsMode\" is not valid. Allowed values: All, Common, Specify, or CompoundID\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1544 1531   <span class="s">}</span>
 | 
| 
 | 
  1545 1532   <span class="k">if</span> <span class="s">(</span>!<span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">detail</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1546 1533     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{detail}, for option \"-d, --detail\" is not valid. Allowed values: > 0 \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1547 1534   <span class="s">}</span>
 | 
| 
 | 
  1548 1535   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">fingerprintsmode</span>} !~ <span class="q">/^(AutoDetect|FingerprintsBitVectorString|FingerprintsVectorString)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1549 1536     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{fingerprintsmode}, for option \"--FingerprintsMode\" is not valid. Allowed values: AutoDetect, FingerprintsBitVectorString or FingerprintsVectorString \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1550 1537   <span class="s">}</span>
 | 
| 
 | 
  1551 1538   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">groupfusionrule</span>} !~ <span class="q">/^(Max|Min|Mean|Median|Sum|Euclidean)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1552 1539     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{groupfusionrule}, for option \"-g, --GroupFusionRule\" is not valid. Allowed values: Max, Min, Mean, Median, Sum, Euclidean\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1553 1540   <span class="s">}</span>
 | 
| 
 | 
  1554 1541   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">groupfusionapplycutoff</span>} !~ <span class="q">/^(Yes|No)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1555 1542     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{groupfusionapplycutoff}, for option \"--GroupFusionApplyCutoff\" is not valid. Allowed values: Yes or No\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1556 1543   <span class="s">}</span>
 | 
| 
 | 
  1557 1544   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">indelim</span>} !~ <span class="q">/^(comma|semicolon)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1558 1545     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{indelim}, for option \"--InDelim\" is not valid. Allowed values: comma, or semicolon\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1559 1546   <span class="s">}</span>
 | 
| 
 | 
  1560 1547   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">mode</span>} !~ <span class="q">/^(IndividualReference|MultipleReferences)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1561 1548     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{mode}, for option \"-m, --mode\" is not valid. Allowed values: IndividualReference, MultipleReferences\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1562 1549   <span class="s">}</span>
 | 
| 
 | 
  1563 1550   <span class="k">if</span> <span class="s">(</span>!<span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">numofsimilarmolecules</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1564 1551     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{numofsimilarmolecules}, for option \"-n, --NumOfSimilarMolecules\" is not valid. Allowed values: > 0 \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1565 1552   <span class="s">}</span>
 | 
| 
 | 
  1566 1553   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">outdelim</span>} !~ <span class="q">/^(comma|semicolon|tab)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1567 1554     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{outdelim}, for option \"--OutDelim\" is not valid. Allowed values: comma, tab, or semicolon\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1568 1555   <span class="s">}</span>
 | 
| 
 | 
  1569 1556   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">output</span>} !~ <span class="q">/^(SD|text|both)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1570 1557     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{output}, for option \"--output\" is not valid. Allowed values: SD, text, or both\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1571 1558   <span class="s">}</span>
 | 
| 
 | 
  1572 1559   <span class="k">if</span> <span class="s">(</span>!<span class="s">(</span><span class="i">IsFloat</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">percentsimilarmolecules</span>}<span class="s">)</span> && <span class="i">$Options</span>{<span class="w">percentsimilarmolecules</span>} > <span class="n">0</span> && <span class="i">$Options</span>{<span class="w">percentsimilarmolecules</span>} <= <span class="n">100</span><span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1573 1560     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{percentsimilarmolecules}, for option \"-p, --PercentSimilarMolecules\" is not valid. Allowed values: > 0 and <= 100 \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1574 1561   <span class="s">}</span>
 | 
| 
 | 
  1575 1562   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">quote</span>} !~ <span class="q">/^(Yes|No)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1576 1563     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{quote}, for option \"-q --quote\" is not valid. Allowed values: Yes or No\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1577 1564   <span class="s">}</span>
 | 
| 
 | 
  1578 1565   <span class="k">if</span> <span class="s">(</span>!<span class="i">IsPositiveInteger</span><span class="s">(</span><span class="i">$Options</span>{<span class="w">precision</span>}<span class="s">)</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1579 1566     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{precision}, for option \"--precision\" is not valid. Allowed values: > 0 \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1580 1567   <span class="s">}</span>
 | 
| 
 | 
  1581 1568   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecolmode</span>} !~ <span class="q">/^(ColNum|ColLabel)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1582 1569     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{referencecolmode}, for option \"--ReferenceColMode\" is not valid. Allowed values: ColNum, or ColLabel\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1583 1570   <span class="s">}</span>
 | 
| 
 | 
  1584 1571   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">referencecompoundidmode</span>} !~ <span class="q">/^(DataField|MolName|LabelPrefix|MolNameOrLabelPrefix)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1585 1572     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{referencecompoundidmode}, for option \"--ReferenceCompoundIDMode\" is not valid. Allowed values: DataField, MolName, LabelPrefix or MolNameOrLabelPrefix\n"</span><span class="sc">;</span>
 | 
| 
 | 
  1586 1573   <span class="s">}</span>
 | 
| 
 | 
  1587 1574   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">searchmode</span>} !~ <span class="q">/^(SimilaritySearch|DissimilaritySearch)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1588 1575     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{searchmode}, for option \"-s, --SearchMode\" is not valid. Allowed values: SimilaritySearch, DissimilaritySearch \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1589 1576   <span class="s">}</span>
 | 
| 
 | 
  1590 1577   <span class="k">if</span> <span class="s">(</span><span class="i">$Options</span>{<span class="w">similarcountmode</span>} !~ <span class="q">/^(NumOfSimilar|PercentSimilar)$/i</span><span class="s">)</span> <span class="s">{</span>
 | 
| 
 | 
  1591 1578     <span class="k">die</span> <span class="q">"Error: The value specified, $Options{similarcountmode}, for option \"--SimilarCountMode\" is not valid. Allowed values: NumOfSimilar, PercentSimilar \n"</span><span class="sc">;</span>
 | 
| 
 | 
  1592 1579   <span class="s">}</span>
 | 
| 
 | 
  1593 1580 <span class="s">}</span>
 | 
| 
 | 
  1594 1581 
 | 
| 
 | 
  1595 <a name="EOF-"></a></pre>
 | 
| 
 | 
  1596 <p> </p>
 | 
| 
 | 
  1597 <br />
 | 
| 
 | 
  1598 <center>
 | 
| 
 | 
  1599 <img src="../../../images/h2o2.png" alt="">
 | 
| 
 | 
  1600 </center>
 | 
| 
 | 
  1601 </body>
 | 
| 
 | 
  1602 </html>
 |