annotate convert_characters.pl @ 2:c58a4238167e default tip

version 2
author greg
date Fri, 05 Aug 2011 16:33:29 -0400
parents 21b1788b85a4
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
21b1788b85a4 Version 1
greg
parents:
diff changeset
#! /usr/bin/perl -w

use strict;
use warnings;

# Converts all characters of one type into another.
#
# Usage:
#   convert_characters.pl [input] [convert_from] [convert_to] [output]
#
# Every run of one or more consecutive "convert_from" characters on a line is
# replaced by a single "convert_to" character; the result is written to
# [output], one "\n"-terminated line per input line.
#
# Codes accepted for convert_from:
#   s  any whitespace     T  tab          Sp any whitespace (same as s)
#   Dt dot                C  comma        D  dash
#   U  underscore         P  pipe
# Codes accepted for convert_to:
#   T  tab                Sp space        Dt dot
#   C  comma              D  dash         U  underscore
#   P  pipe
#
# Dies with a message if the argument count is not 4, if either code is not
# recognised, or if a file cannot be opened, written or closed.

die "Check argument\n" unless @ARGV == 4;

my ($inputfile, $convert_from, $convert_to, $outputfile) = @ARGV;

# Regex atom matched for each convert_from code. Each value is a single atom
# so that a quantifier can be applied to it directly.
# NOTE(review): "Sp" matches any whitespace (\s), not only the space
# character; this mirrors the original behaviour - confirm it is intended.
my %pattern_for = (
    s  => '\s',
    T  => '\t',
    Sp => '\s',
    Dt => '\.',
    C  => ',',
    D  => '-',
    U  => '_',
    P  => '\|',
);

# Literal text written for each convert_to code. These are plain strings, not
# regex fragments: "Sp" must be a real space, because '\s' in a replacement
# would be emitted as a backslash followed by the letter s.
my %replacement_for = (
    T  => "\t",
    Sp => ' ',
    Dt => '.',
    C  => ',',
    D  => '-',
    U  => '_',
    P  => '|',
);

die "Invalid value specified for convert from\n"
    unless exists $pattern_for{$convert_from};
die "Invalid value specified for convert to\n"
    unless exists $replacement_for{$convert_to};

# Compile once: one or more consecutive occurrences of the source character.
my $from_re = qr/(?:$pattern_for{$convert_from})+/;
my $to_text = $replacement_for{$convert_to};

# Three-argument open keeps the file names from being parsed as part of the
# open mode (leading/trailing whitespace or mode characters in a name).
open my $fh_in, '<', $inputfile
    or die "Cannot open source file '$inputfile': $!\n";
open my $fh_out, '>', $outputfile
    or die "Cannot open output file '$outputfile': $!\n";

while (my $line = <$fh_in>) {
    # The line terminator is removed first so that a whitespace pattern
    # cannot swallow it; it is re-added unconditionally on output.
    chomp $line;
    $line =~ s/$from_re/$to_text/g;
    print {$fh_out} $line, "\n"
        or die "Cannot write to output file '$outputfile': $!\n";
}

close $fh_in  or die "Cannot close source file\n";
# Buffered write errors surface at close time, so this check matters.
close $fh_out or die "Cannot close output file\n";