annotate docs/scripts/man1/ExtractFromTextFiles.1 @ 0:4816e4a8ae95 draft default tip

Uploaded
author deepakjadmin
date Wed, 20 Jan 2016 09:23:18 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
1 .\" Automatically generated by Pod::Man 2.25 (Pod::Simple 3.22)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
2 .\"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
3 .\" Standard preamble:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
4 .\" ========================================================================
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
5 .de Sp \" Vertical space (when we can't use .PP)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
6 .if t .sp .5v
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
7 .if n .sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
8 ..
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
9 .de Vb \" Begin verbatim text
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
10 .ft CW
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
11 .nf
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
12 .ne \\$1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
13 ..
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
14 .de Ve \" End verbatim text
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
15 .ft R
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
16 .fi
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
17 ..
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
18 .\" Set up some character translations and predefined strings. \*(-- will
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
19 .\" give an unbreakable dash, \*(PI will give pi, \*(L" will give a left
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
20 .\" double quote, and \*(R" will give a right double quote. \*(C+ will
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
21 .\" give a nicer C++. Capital omega is used to do unbreakable dashes and
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
22 .\" therefore won't be available. \*(C` and \*(C' expand to `' in nroff,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
23 .\" nothing in troff, for use with C<>.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
24 .tr \(*W-
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
25 .ds C+ C\v'-.1v'\h'-1p'\s-2+\h'-1p'+\s0\v'.1v'\h'-1p'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
26 .ie n \{\
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
27 . ds -- \(*W-
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
28 . ds PI pi
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
29 . if (\n(.H=4u)&(1m=24u) .ds -- \(*W\h'-12u'\(*W\h'-12u'-\" diablo 10 pitch
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
30 . if (\n(.H=4u)&(1m=20u) .ds -- \(*W\h'-12u'\(*W\h'-8u'-\" diablo 12 pitch
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
31 . ds L" ""
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
32 . ds R" ""
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
33 . ds C` ""
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
34 . ds C' ""
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
35 'br\}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
36 .el\{\
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
37 . ds -- \|\(em\|
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
38 . ds PI \(*p
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
39 . ds L" ``
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
40 . ds R" ''
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
41 'br\}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
42 .\"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
43 .\" Escape single quotes in literal strings from groff's Unicode transform.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
44 .ie \n(.g .ds Aq \(aq
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
45 .el .ds Aq '
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
46 .\"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
47 .\" If the F register is turned on, we'll generate index entries on stderr for
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
48 .\" titles (.TH), headers (.SH), subsections (.SS), items (.Ip), and index
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
49 .\" entries marked with X<> in POD. Of course, you'll have to process the
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
50 .\" output yourself in some meaningful fashion.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
51 .ie \nF \{\
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
52 . de IX
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
53 . tm Index:\\$1\t\\n%\t"\\$2"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
54 ..
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
55 . nr % 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
56 . rr F
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
57 .\}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
58 .el \{\
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
59 . de IX
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
60 ..
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
61 .\}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
62 .\"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
63 .\" Accent mark definitions (@(#)ms.acc 1.5 88/02/08 SMI; from UCB 4.2).
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
64 .\" Fear. Run. Save yourself. No user-serviceable parts.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
65 . \" fudge factors for nroff and troff
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
66 .if n \{\
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
67 . ds #H 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
68 . ds #V .8m
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
69 . ds #F .3m
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
70 . ds #[ \f1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
71 . ds #] \fP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
72 .\}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
73 .if t \{\
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
74 . ds #H ((1u-(\\\\n(.fu%2u))*.13m)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
75 . ds #V .6m
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
76 . ds #F 0
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
77 . ds #[ \&
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
78 . ds #] \&
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
79 .\}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
80 . \" simple accents for nroff and troff
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
81 .if n \{\
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
82 . ds ' \&
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
83 . ds ` \&
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
84 . ds ^ \&
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
85 . ds , \&
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
86 . ds ~ ~
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
87 . ds /
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
88 .\}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
89 .if t \{\
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
90 . ds ' \\k:\h'-(\\n(.wu*8/10-\*(#H)'\'\h"|\\n:u"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
91 . ds ` \\k:\h'-(\\n(.wu*8/10-\*(#H)'\`\h'|\\n:u'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
92 . ds ^ \\k:\h'-(\\n(.wu*10/11-\*(#H)'^\h'|\\n:u'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
93 . ds , \\k:\h'-(\\n(.wu*8/10)',\h'|\\n:u'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
94 . ds ~ \\k:\h'-(\\n(.wu-\*(#H-.1m)'~\h'|\\n:u'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
95 . ds / \\k:\h'-(\\n(.wu*8/10-\*(#H)'\z\(sl\h'|\\n:u'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
96 .\}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
97 . \" troff and (daisy-wheel) nroff accents
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
98 .ds : \\k:\h'-(\\n(.wu*8/10-\*(#H+.1m+\*(#F)'\v'-\*(#V'\z.\h'.2m+\*(#F'.\h'|\\n:u'\v'\*(#V'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
99 .ds 8 \h'\*(#H'\(*b\h'-\*(#H'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
100 .ds o \\k:\h'-(\\n(.wu+\w'\(de'u-\*(#H)/2u'\v'-.3n'\*(#[\z\(de\v'.3n'\h'|\\n:u'\*(#]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
101 .ds d- \h'\*(#H'\(pd\h'-\w'~'u'\v'-.25m'\f2\(hy\fP\v'.25m'\h'-\*(#H'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
102 .ds D- D\\k:\h'-\w'D'u'\v'-.11m'\z\(hy\v'.11m'\h'|\\n:u'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
103 .ds th \*(#[\v'.3m'\s+1I\s-1\v'-.3m'\h'-(\w'I'u*2/3)'\s-1o\s+1\*(#]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
104 .ds Th \*(#[\s+2I\s-2\h'-\w'I'u*3/5'\v'-.3m'o\v'.3m'\*(#]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
105 .ds ae a\h'-(\w'a'u*4/10)'e
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
106 .ds Ae A\h'-(\w'A'u*4/10)'E
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
107 . \" corrections for vroff
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
108 .if v .ds ~ \\k:\h'-(\\n(.wu*9/10-\*(#H)'\s-2\u~\d\s+2\h'|\\n:u'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
109 .if v .ds ^ \\k:\h'-(\\n(.wu*10/11-\*(#H)'\v'-.4m'^\v'.4m'\h'|\\n:u'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
110 . \" for low resolution devices (crt and lpr)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
111 .if \n(.H>23 .if \n(.V>19 \
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
112 \{\
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
113 . ds : e
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
114 . ds 8 ss
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
115 . ds o a
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
116 . ds d- d\h'-1'\(ga
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
117 . ds D- D\h'-1'\(hy
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
118 . ds th \o'bp'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
119 . ds Th \o'LP'
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
120 . ds ae ae
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
121 . ds Ae AE
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
122 .\}
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
123 .rm #[ #] #H #V #F C
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
124 .\" ========================================================================
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
125 .\"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
126 .IX Title "EXTRACTFROMTEXTFILES 1"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
127 .TH EXTRACTFROMTEXTFILES 1 "2015-03-29" "perl v5.14.2" "MayaChemTools"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
128 .\" For nroff, turn off justification. Always turn off hyphenation; it makes
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
129 .\" way too many mistakes in technical documents.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
130 .if n .ad l
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
131 .nh
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
132 .SH "NAME"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
133 ExtractFromTextFiles.pl \- Extract specific data from TextFile(s)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
134 .SH "SYNOPSIS"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
135 .IX Header "SYNOPSIS"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
136 ExtractFromTextFiles.pl TextFile(s)...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
137 .PP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
138 ExtractFromTextFiles.pl [\fB\-c, \-\-colmode\fR colnum | collabel] [\fB\-\-categorycol \fR number | string]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
139 [\fB\-\-columns\fR \*(L"colnum,[colnum]...\*(R" | \*(L"collabel,[collabel]...\*(R"] [\fB\-h, \-\-help\fR]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
140 [\fB\-\-indelim\fR \fIcomma | semicolon\fR] [\fB\-m, \-\-mode \fR \fIcolumns | rows | categories\fR]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
141 [\fB\-o, \-\-overwrite\fR] [\fB\-\-outdelim\fR \fIcomma | tab | semicolon\fR] [\fB\-q, \-\-quote\fR \fIyes | no\fR]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
142 [\fB\-\-rows\fR \*(L"colid,value,criteria...\*(R" | \*(L"colid,value...\*(R" | \*(L"colid,mincolvalue,maxcolvalue\*(R" | \*(L"rownum,rownum,...\*(R" | colid | \*(L"minrownum,maxrownum\*(R"]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
143 [ \fB\-\-rowsmode\fR rowsbycolvalue | rowsbycolvaluelist | rowsbycolvaluerange | rowbymincolvalue | rowbymaxcolvalue | rownums | rownumrange]
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
144 [\fB\-r, \-\-root\fR \fIrootname\fR] [\fB\-w, \-\-workingdir\fR \fIdirname\fR] TextFile(s)...
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
145 .SH "DESCRIPTION"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
146 .IX Header "DESCRIPTION"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
147 Extract column(s)/row(s) data from \fITextFile(s)\fR identified by column numbers or labels. Or categorize
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
148 data using a specified column category. During categorization, a summary text file is
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
149 generated containing category name and count; an additional text file, containing data for
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
150 each category, is also generated. The file names are separated by spaces. The
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
151 valid file extensions are \fI.csv\fR and \fI.tsv\fR for comma/semicolon and tab delimited
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
152 text files respectively. All other file names are ignored. All the text files in a
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
153 current directory can be specified by \fI*.csv\fR, \fI*.tsv\fR, or the current directory
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
154 name. The \fB\-\-indelim\fR option determines the format of \fITextFile(s)\fR. Any file
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
155 which doesn't correspond to the format indicated by \fB\-\-indelim\fR option is ignored.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
156 .SH "OPTIONS"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
157 .IX Header "OPTIONS"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
158 .IP "\fB\-c, \-\-colmode\fR \fIcolnum | collabel\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
159 .IX Item "-c, --colmode colnum | collabel"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
160 Specify how columns are identified in \fITextFile(s)\fR: using column number or column
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
161 label. Possible values: \fIcolnum or collabel\fR. Default value: \fIcolnum\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
162 .IP "\fB\-\-categorycol \fR \fInumber | string\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
163 .IX Item "--categorycol number | string"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
164 Column used to categorize data. Default value: First column.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
165 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
166 For \fIcolnum\fR value of \fB\-c, \-\-colmode\fR option, input value is a column number.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
167 Example: \fI1\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
168 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
169 For \fIcollabel\fR value of \fB\-c, \-\-colmode\fR option, input value is a column label.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
170 Example: \fIMol_ID\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
171 .ie n .IP "\fB\-\-columns\fR \fI""colnum,[colnum]..."" | ""collabel,[collabel]...""\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
172 .el .IP "\fB\-\-columns\fR \fI``colnum,[colnum]...'' | ``collabel,[collabel]...''\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
173 .IX Item "--columns colnum,[colnum]... | collabel,[collabel]..."
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
174 List of comma delimited columns to extract. Default value: First column.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
175 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
176 For \fIcolnum\fR value of \fB\-c, \-\-colmode\fR option, input values format is:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
177 \&\fIcolnum,colnum,...\fR. Example: \fI1,3,5\fR
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
178 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
179 For \fIcollabel\fR value of \fB\-c, \-\-colmode\fR option, input values format is:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
180 \&\fIcollabel,collabel,..\fR. Example: \fIMol_ID,MolWeight\fR
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
181 .IP "\fB\-h, \-\-help\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
182 .IX Item "-h, --help"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
183 Print this help message.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
184 .IP "\fB\-\-indelim\fR \fIcomma | semicolon\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
185 .IX Item "--indelim comma | semicolon"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
186 Input delimiter for \s-1CSV\s0 \fITextFile(s)\fR. Possible values: \fIcomma or semicolon\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
187 Default value: \fIcomma\fR. For \s-1TSV\s0 files, this option is ignored and \fItab\fR is used as a
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
188 delimiter.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
189 .IP "\fB\-m, \-\-mode \fR \fIcolumns | rows | categories\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
190 .IX Item "-m, --mode columns | rows | categories"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
191 Specify what to extract from \fITextFile(s)\fR. Possible values: \fIcolumns, rows,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
192 or categories\fR. Default value: \fIcolumns\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
193 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
194 For \fIcolumns\fR mode, data for appropriate columns specified by \fB\-\-columns\fR option
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
195 is extracted from \fITextFile(s)\fR and placed into new text files.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
196 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
197 For \fIrows\fR mode, appropriate rows specified in conjunction with \fB\-\-rowsmode\fR and
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
198 \&\fB\-\-rows\fR options are extracted from \fITextFile(s)\fR and placed into new text files.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
199 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
200 For \fIcategories\fR mode, column specified by \fB\-\-categorycol\fR is
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
201 used to categorize data, and a summary text file is generated
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
202 containing category name and count; an additional text file, containing data for
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
203 each category, is also generated.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
204 .IP "\fB\-o, \-\-overwrite\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
205 .IX Item "-o, --overwrite"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
206 Overwrite existing files.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
207 .IP "\fB\-\-outdelim\fR \fIcomma | tab | semicolon\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
208 .IX Item "--outdelim comma | tab | semicolon"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
209 Output text file delimiter. Possible values: \fIcomma, tab, or semicolon\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
210 Default value: \fIcomma\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
211 .IP "\fB\-q, \-\-quote\fR \fIyes | no\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
212 .IX Item "-q, --quote yes | no"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
213 Put quotes around column values in output text file. Possible values: \fIyes or
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
214 no\fR. Default value: \fIyes\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
215 .IP "\fB\-r, \-\-root\fR \fIrootname\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
216 .IX Item "-r, --root rootname"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
217 New file name is generated using the root: <Root>.<Ext>. Default for new file
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
218 names: <TextFile>CategoriesSummary.<Ext>, <TextFile>ExtractedColumns.<Ext>, and
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
219 <TextFile>ExtractedRows.<Ext> for \fIcategories\fR, \fIcolumns\fR, and \fIrows\fR mode
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
220 respectively. And <TextFile>Category<CategoryName>.<Ext>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
221 for each category retrieved from each text file. The output file type determines <Ext>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
222 value: csv and tsv for \s-1CSV\s0, and \s-1TSV\s0 files respectively.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
223 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
224 This option is ignored for multiple input files.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
225 .ie n .IP "\fB\-\-rows\fR \fI""colid,value,criteria..."" | ""colid,value..."" | ""colid,mincolvalue,maxcolvalue"" | ""rownum,rownum,..."" | colid | ""minrownum,maxrownum""\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
226 .el .IP "\fB\-\-rows\fR \fI``colid,value,criteria...'' | ``colid,value...'' | ``colid,mincolvalue,maxcolvalue'' | ``rownum,rownum,...'' | colid | ``minrownum,maxrownum''\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
227 .IX Item "--rows colid,value,criteria... | colid,value... | colid,mincolvalue,maxcolvalue | rownum,rownum,... | colid | minrownum,maxrownum"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
228 This value is \fB\-\-rowsmode\fR specific. In general, it's a list of comma separated column ids and
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
229 associated mode specific values. Column ids specification, column label or number, is
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
230 controlled by \fB\-c, \-\-colmode\fR option.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
231 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
232 First line containing column labels is always written out. And value comparisons assume
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
233 numerical column data.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
234 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
235 For \fIrowsbycolvalue\fR mode, input value format contains these triplets:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
236 \&\fIcolid,value, criteria...\fR. Possible values for criteria: \fIle, ge or eq\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
237 Examples:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
238 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
239 .Vb 2
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
240 \& MolWt,450,le
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
241 \& MolWt,450,le,LogP,5,le,SumNumNO,10,le,SumNHOH,5,le
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
242 .Ve
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
243 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
244 For \fIrowsbycolvaluelist\fR mode, input value format is: \fIcolid,value...\fR. Examples:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
245 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
246 .Vb 2
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
247 \& Mol_ID,20
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
248 \& Mol_ID,20,1002,1115
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
249 .Ve
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
250 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
251 For \fIrowsbycolvaluerange\fR mode, input value format is: \fIcolid,mincolvalue,maxcolvalue\fR. Examples:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
252 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
253 .Vb 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
254 \& MolWt,100,450
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
255 .Ve
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
256 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
257 For \fIrowbymincolvalue, rowbymaxcolvalue\fR modes, input value format is: \fIcolid\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
258 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
259 For \fIrownum\fR mode, input value format is: \fIrownum\fR. Default value: \fI2\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
260 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
261 For \fIrownumrange\fR mode, input value format is: \fIminrownum, maxrownum\fR. Examples:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
262 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
263 .Vb 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
264 \& 10,40
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
265 .Ve
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
266 .IP "\fB\-\-rowsmode\fR \fIrowsbycolvalue | rowsbycolvaluelist | rowsbycolvaluerange | rowbymincolvalue | rowbymaxcolvalue | rownums | rownumrange\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
267 .IX Item "--rowsmode rowsbycolvalue | rowsbycolvaluelist | rowsbycolvaluerange | rowbymincolvalue | rowbymaxcolvalue | rownums | rownumrange"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
268 Specify how to extract rows from \fITextFile(s)\fR. Possible values: \fIrowsbycolvalue, rowsbycolvaluelist, rowsbycolvaluerange,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
269 rowbymincolvalue, rowbymaxcolvalue, rownum, rownumrange\fR. Default value: \fIrownum\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
270 .Sp
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
271 Use \fB\-\-rows\fR option to list row criteria used for extraction of rows from
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
272 \&\fITextFile(s)\fR.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
273 .IP "\fB\-w, \-\-workingdir\fR \fIdirname\fR" 4
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
274 .IX Item "-w, --workingdir dirname"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
275 Location of working directory. Default: current directory.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
276 .SH "EXAMPLES"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
277 .IX Header "EXAMPLES"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
278 To extract first column from a text file and generate a new \s-1CSV\s0 text file NewSample1.csv,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
279 type:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
280 .PP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
281 .Vb 1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
282 \& % ExtractFromTextFiles.pl \-r NewSample1 \-o Sample1.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
283 .Ve
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
284 .PP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
285 To extract columns Mol_ID, MolWeight, and \s-1NAME\s0 from Sample1.csv and generate a new
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
286 textfile NewSample1.tsv with no quotes, type:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
287 .PP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
288 .Vb 3
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
289 \& % ExtractFromTextFiles.pl \-m columns \-c collabel \-\-columns "Mol_ID,
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
290 \& MolWeight,NAME" \-\-outdelim tab \-\-quote no \-r NewSample1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
291 \& \-o Sample1.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
292 .Ve
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
293 .PP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
294 To extract rows containing values for MolWeight column of less than or equal to 450 from
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
295 Sample1.csv and generate a new textfile NewSample1.csv, type:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
296 .PP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
297 .Vb 3
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
298 \& % ExtractFromTextFiles.pl \-m rows \-\-rowsmode rowsbycolvalue
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
299 \& \-c collabel \-\-rows MolWeight,450,le \-r NewSample1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
300 \& \-o Sample1.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
301 .Ve
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
302 .PP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
303 To extract rows containing values for MolWeight column between 450 and 500 from
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
304 Sample1.csv and generate a new textfile NewSample1.csv, type:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
305 .PP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
306 .Vb 3
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
307 \& % ExtractFromTextFiles.pl \-m rows \-\-rowsmode rowsbycolvaluerange
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
308 \& \-c collabel \-\-rows MolWeight,450,500 \-r NewSample1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
309 \& \-o Sample1.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
310 .Ve
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
311 .PP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
312 To extract a row containing minimum value for column MolWeight from Sample1.csv and generate
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
313 a new textfile NewSample1.csv, type:
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
314 .PP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
315 .Vb 3
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
316 \& % ExtractFromTextFiles.pl \-m rows \-\-rowsmode rowbymincolvalue
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
317 \& \-c collabel \-\-rows MolWeight \-r NewSample1
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
318 \& \-o Sample1.csv
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
319 .Ve
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
320 .SH "AUTHOR"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
321 .IX Header "AUTHOR"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
322 Manish Sud <msud@san.rr.com>
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
323 .SH "SEE ALSO"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
324 .IX Header "SEE ALSO"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
325 JoinTextFiles.pl, MergeTextFilesWithSD.pl, ModifyTextFilesFormat.pl, SplitTextFiles.pl
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
326 .SH "COPYRIGHT"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
327 .IX Header "COPYRIGHT"
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
328 Copyright (C) 2015 Manish Sud. All rights reserved.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
329 .PP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
330 This file is part of MayaChemTools.
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
331 .PP
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
332 MayaChemTools is free software; you can redistribute it and/or modify it under
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
333 the terms of the \s-1GNU\s0 Lesser General Public License as published by the Free
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
334 Software Foundation; either version 3 of the License, or (at your option)
4816e4a8ae95 Uploaded
deepakjadmin
parents:
diff changeset
335 any later version.