Mercurial > repos > deepakjadmin > r_caret_test
comparison caret_future/tool2/modelBuilding.py @ 0:68300206e90d draft default tip
Uploaded
| author | deepakjadmin |
|---|---|
| date | Thu, 05 Nov 2015 02:41:30 -0500 |
| parents | |
| children |
comparison
equal
deleted
inserted
replaced
| -1:000000000000 | 0:68300206e90d |
|---|---|
| 1 def __inputArguments(): | |
| 2 | |
| 3 import argparse | |
| 4 parser = argparse.ArgumentParser() | |
| 5 | |
| 6 parser.add_argument("--method", nargs='?',default ='pls',help="Name of the method on which model will build; \ | |
| 7 Available Methods are:- pls, glm , glmboost ") | |
| 8 parser.add_argument("rdata",help="Descriptor file for model building") | |
| 9 parser.add_argument("--getdatainfoeval",nargs='?',default='TRUE',help="Validation of the data ") | |
| 10 parser.add_argument("--getdatainfoecho",nargs='?',default='FALSE',help="print on consol about Validity of the data ") | |
| 11 parser.add_argument("--getdatainforesult",nargs='?',default='hide',help="print in output file about Validity of the data ") | |
| 12 parser.add_argument("--missingfiltereval",nargs='?',default='FALSE',help="Processing step :: removal of missing value ") | |
| 13 parser.add_argument("--missingfilterecho",nargs='?',default='FALSE',help="print Processing step :: removal of missing value ") | |
| 14 parser.add_argument("--missingfilterresult",nargs='?',default='hide',help="print in output file about Processing step :: removal of missing value ") | |
| 15 parser.add_argument("--missingfilterthreshc",nargs='?',default=0.20,type=float,help="info about highly missing column data") | |
| 16 parser.add_argument("--missingfilterthreshr",nargs='?',default=0.20,type=float,help="info about highly missing row number") | |
| 17 parser.add_argument("--pcaeval",nargs='?',default='FALSE',help="PCA of data ") | |
| 18 parser.add_argument("--pcaecho",nargs='?',default='FALSE',help="PCA of data ") | |
| 19 parser.add_argument("--pcaresult",nargs='?',default='hide',help="print in file about PCA of data ") | |
| 20 parser.add_argument("--pcacomp",nargs='?',default=3,type=int,help="Number of PCA componant will be plotted ") | |
| 21 parser.add_argument("--pcaploteval",nargs='?',default='FALSE',help="PCA plot of data ") | |
| 22 parser.add_argument("--pcaplotecho",nargs='?',default='FALSE',help="print PCA plot of data ") | |
| 23 parser.add_argument("--pcaplotresult",nargs='?',default='hide',help="write in output file about PCA plot of data") | |
| 24 parser.add_argument("--pcaplotfig",nargs='?',default='TRUE',help="make figure file for integration in output file") | |
| 25 parser.add_argument("--initialdataspliteval",nargs='?',default='TRUE',help="data splitting in test and train set ") | |
| 26 parser.add_argument("--initialdatasplitecho",nargs='?',default='FALSE',help="print about data splitting in test and train set") | |
| 27 parser.add_argument("--initialdatasplitresult",nargs='?',default='hide',help="write in outputfile about data splitting in test and train set") | |
| 28 parser.add_argument("--saampling",nargs='?',default="garBage",help="Perform sampling from data") | |
| 29 parser.add_argument("--percent",nargs='?',default=0.8,type=float,help="percent value at which data splitting is done") | |
| 30 parser.add_argument("--nzveval",nargs='?',default='FALSE',help="remove near zero values") | |
| 31 parser.add_argument("--nzvresult",nargs='?',default='hide',help="write in outputfile about removing near zero values") | |
| 32 parser.add_argument("--nzvecho",nargs='?',default='FALSE',help="print about removing near zero values") | |
| 33 parser.add_argument("--corrfiltereval",nargs='?',default='FALSE',help="remove higly correlated values") | |
| 34 parser.add_argument("--corrfilterresult",nargs='?',default='hide',help="write in outputfile about removing highly correlated values") | |
| 35 parser.add_argument("--corrfilterecho",nargs='?',default='FALSE',help="print about removing correlated values") | |
| 36 parser.add_argument("--threshholdcor",nargs='?',default=0.75,type=float,help="percent value at which correlated values ommitted ") | |
| 37 parser.add_argument("--preproceval",nargs='?',default='FALSE',help="pre proccesing") | |
| 38 parser.add_argument("--preprocecho",nargs='?',default='FALSE',help="print about pre proccesing") | |
| 39 parser.add_argument("--preprocresult",nargs='?',default='hide',help="write in output file about pre proccesing") | |
| 40 parser.add_argument("--setupworkersecho",nargs='?',default='FALSE',help="print about number of processors") | |
| 41 parser.add_argument("--setupworkersresult",nargs='?',default='tex',help="write about number of processors in output file") | |
| 42 parser.add_argument("--numworkers",nargs='?',default=1,type=int,help="defines used processors") | |
| 43 parser.add_argument("--setupresamplingecho",nargs='?',default='FALSE',help="print resampling rules") | |
| 44 parser.add_argument("--setupresamplingresult",nargs='?',default='hide',help="write resampling rules in output file") | |
| 45 parser.add_argument("--resampname",nargs='?',default='boot632',help="choose type of resampling") | |
| 46 parser.add_argument("--resamplenumber",nargs='?',default=10,type=int,help="set number of resampling") | |
| 47 parser.add_argument("--numrepeat",nargs='?',default=3,type=int,help="set times of repeat") | |
| 48 parser.add_argument("--resamplenumberpercent",nargs='?',default=0.75,type=float,help="set PERCENT resampling") | |
| 49 parser.add_argument("--setupgridresult",nargs='?',default='hide',help="write about number of grids in output file") | |
| 50 parser.add_argument("--setupgridecho",nargs='?',default='FALSE',help="print about number of grids") | |
| 51 parser.add_argument("--setupgridsize",nargs='?',default=3,type=int,help="set number of grids") | |
| 52 parser.add_argument("--fitmodelresult",nargs='?',default='hide',help="write about model") | |
| 53 parser.add_argument("--fitmodelecho",nargs='?',default='FALSE',help="print about model") | |
| 54 parser.add_argument("--fitmodeleval",nargs='?',default='TRUE',help="start model building") | |
| 55 parser.add_argument("--modeldescrecho",nargs='?',default='FALSE',help="print model description") | |
| 56 parser.add_argument("--modeldescrresult",nargs='?',default='hide',help="write model description in outout file") | |
| 57 parser.add_argument("--resamptableecho",nargs='?',default='FALSE',help="print resample table") | |
| 58 parser.add_argument("--resamptableresult",nargs='?',default='tex',help="write resample table in output file") | |
| 59 parser.add_argument("--profileplotecho",nargs='?',default='FALSE',help="print about profile plots") | |
| 60 parser.add_argument("--profileplotfig",nargs='?',default='TRUE',help=" profile plots") | |
| 61 parser.add_argument("--stopworkersecho",nargs='?',default='FALSE',help="stop workers ie processors") | |
| 62 parser.add_argument("--stopworkersresult",nargs='?',default='hide',help="write about workers ie processors used") | |
| 63 parser.add_argument("--testpredresult",nargs='?',default='tex',help="write about statistical measure") | |
| 64 parser.add_argument("--testpredecho",nargs='?',default='FALSE',help="print about statistical measure") | |
| 65 parser.add_argument("--classprobstexresult",nargs='?',default='tex',help="paste various figure of statistical measure in outputfile") | |
| 66 parser.add_argument("--classprobstexecho",nargs='?',default='FALSE',help="print various figure of statistical measure") | |
| 67 parser.add_argument("--classprobstexresult1",nargs='?',default='hide',help="create roc curve in outputfile") | |
| 68 parser.add_argument("--classprobstexecho1",nargs='?',default='FALSE',help="print figure of statistical measure") | |
| 69 parser.add_argument("--savedataecho",nargs='?',default='FALSE',help="information about completion of model building ") | |
| 70 parser.add_argument("--savedataresult",nargs='?',default='hide',help="write information about completion of model building in outputfile ") | |
| 71 parser.add_argument("--datasets", help="name of the generated datasets") | |
| 72 parser.add_argument("--outputmodel", help="give name for the generated model") | |
| 73 parser.add_argument("--outputresultpdf", help="give name for the output pdf file") | |
| 74 | |
| 75 args = parser.parse_args() | |
| 76 return args | |
| 77 | |
| 78 def generateRnwScript(): | |
| 79 | |
| 80 import templateLibrary | |
| 81 t = templateLibrary.__template4Rnw() | |
| 82 | |
| 83 from string import Template | |
| 84 s = Template(t) | |
| 85 | |
| 86 args = __inputArguments() | |
| 87 | |
| 88 templt = s.safe_substitute(METHOD=args.method, | |
| 89 RDATA=args.rdata, | |
| 90 GETDATAINFOEVAL=args.getdatainfoeval, | |
| 91 GETDATAINFOECHO=args.getdatainfoecho, | |
| 92 GETDATAINFORESULT=args.getdatainforesult, | |
| 93 MISSINGFILTEREVAL=args.missingfiltereval, | |
| 94 MISSINGFILTERECHO=args.missingfilterecho, | |
| 95 MISSINGFILTERRESULT=args.missingfilterresult, | |
| 96 MISSINGFILTERTHRESHC=args.missingfilterthreshc, | |
| 97 MISSINGFILTERTHRESHR=args.missingfilterthreshr, | |
| 98 PCAEVAL=args.pcaeval, | |
| 99 PCAECHO=args.pcaecho, | |
| 100 PCARESULT=args.pcaresult, | |
| 101 PCACOMP=args.pcacomp, | |
| 102 PCAPLOTEVAL=args.pcaploteval, | |
| 103 PCAPLOTECHO=args.pcaplotecho, | |
| 104 PCAPLOTRESULT=args.pcaplotresult, | |
| 105 PCAPLOTFIG=args.pcaplotfig, | |
| 106 INITIALDATASPLITEVAL=args.initialdataspliteval, | |
| 107 INITIALDATASPLITECHO=args.initialdatasplitecho, | |
| 108 INITIALDATASPLITRESULT=args.initialdatasplitresult, | |
| 109 SAAMPLING=args.saampling, | |
| 110 PERCENT=args.percent, | |
| 111 NZVEVAL=args.nzveval, | |
| 112 NZVRESULT=args.nzvresult, | |
| 113 NZVECHO=args.nzvecho, | |
| 114 CORRFILTEREVAL=args.corrfiltereval, | |
| 115 CORRFILTERRESULT=args.corrfilterresult, | |
| 116 CORRFILTERECHO=args.corrfilterecho, | |
| 117 THRESHHOLDCOR=args.threshholdcor, | |
| 118 PREPROCEVAL=args.preproceval, | |
| 119 PREPROCECHO=args.preprocecho, | |
| 120 PREPROCRESULT=args.preprocresult, | |
| 121 SETUPWORKERSECHO=args.setupworkersecho, | |
| 122 SETUPWORKERSRESULT=args.setupworkersresult, | |
| 123 NUMWORKERS=args.numworkers, | |
| 124 SETUPRESAMPLINGECHO=args.setupresamplingecho, | |
| 125 SETUPRESAMPLINGRESULT=args.setupresamplingresult, | |
| 126 RESAMPNAME=args.resampname, | |
| 127 RESAMPLENUMBER=args.resamplenumber, | |
| 128 NUMREPEAT=args.numrepeat, | |
| 129 RESAMPLENUMBERPERCENT=args.resamplenumberpercent, | |
| 130 SETUPGRIDRESULT=args.setupgridresult, | |
| 131 SETUPGRIDECHO=args.setupgridecho, | |
| 132 SETUPGRIDSIZE=args.setupgridsize, | |
| 133 FITMODELRESULT=args.fitmodelresult, | |
| 134 FITMODELECHO=args.fitmodelecho, | |
| 135 FITMODELEVAL=args.fitmodeleval, | |
| 136 MODELDESCRECHO=args.modeldescrecho, | |
| 137 MODELDESCRRESULT=args.modeldescrresult, | |
| 138 RESAMPTABLEECHO=args.resamptableecho, | |
| 139 RESAMPTABLERESULT=args.resamptableresult, | |
| 140 PROFILEPLOTECHO=args.profileplotecho, | |
| 141 PROFILEPLOTFIG=args.profileplotfig, | |
| 142 STOPWORKERSECHO=args.stopworkersecho, | |
| 143 STOPWORKERSRESULT=args.stopworkersresult, | |
| 144 TESTPREDRESULT=args.testpredresult, | |
| 145 TESTPREDECHO=args.testpredecho, | |
| 146 CLASSPROBSTEXRESULT=args.classprobstexresult, | |
| 147 CLASSPROBSTEXECHO=args.classprobstexecho, | |
| 148 CLASSPROBSTEXRESULT1=args.classprobstexresult1, | |
| 149 CLASSPROBSTEXECHO1=args.classprobstexecho1, | |
| 150 SAVEDATAECHO=args.savedataecho, | |
| 151 SAVEDATARESULT=args.savedataresult ) | |
| 152 | |
| 153 | |
| 154 f = open('result-doc.Rnw','w') | |
| 155 f.write(templt) | |
| 156 f.close() | |
| 157 | |
| 158 def modelBuilding(): | |
| 159 | |
| 160 import os | |
| 161 os.system('R CMD Sweave result-doc.Rnw > cmd.log.1 2>&1') | |
| 162 os.system('pdflatex result-doc.tex > cmd.log.2 2>&1') | |
| 163 os.system('pdflatex result-doc.tex > cmd.log.2 2>&1') | |
| 164 # os.system('pdflatex result-doc.tex 2>&1 | tee cmd.log.2') | |
| 165 args = __inputArguments() | |
| 166 | |
| 167 from string import Template | |
| 168 s1 = Template('cp $METHOD-Fit.RData $OUTPUTMODEL') | |
| 169 s2 = Template('cp result-doc.pdf $OUTPUTRESULTPDF') | |
| 170 s3 = Template('cp datasets.RData $DATASETS') | |
| 171 | |
| 172 cmd1 = s1.safe_substitute(METHOD=args.method, OUTPUTMODEL=args.outputmodel) | |
| 173 cmd2 = s2.safe_substitute(OUTPUTRESULTPDF=args.outputresultpdf) | |
| 174 cmd3 = s3.safe_substitute(DATASETS=args.datasets) | |
| 175 | |
| 176 os.system(cmd1) | |
| 177 os.system(cmd2) | |
| 178 os.system(cmd3) | |
| 179 | |
| 180 if __name__ == "__main__" : | |
| 181 | |
| 182 generateRnwScript() | |
| 183 modelBuilding() |
