annotate directory_copier.py @ 1:1487421505f1 draft

Uploaded correct tool this time
author brenninc
date Wed, 23 Mar 2016 12:08:33 -0400
parents 25b07ce180d4
children 3911ee1a0078
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
1 import gzip
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
2 import optparse # using optparse as hydra still python 2.6
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
3 import os.path
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
4 import shutil
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
5 import sys
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
6
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
7 def report_error(*args):
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
8 sys.stderr.write(' '.join(map(str,args)) + '\n')
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
9 sys.stderr.flush()
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
10 sys.exit(1)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
11
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
12
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
13 def check_pattern_get_new_name(a_file, ending, options):
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
14 if options.start:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
15 if not(a_file.startswith(options.start)):
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
16 return None
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
17 if options.last:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
18 if ending[0] == ".":
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
19 last = options.last + ending
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
20 else:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
21 if options.last[-1] == ".":
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
22 last = options.last + ending
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
23 else:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
24 last = options.last + "." + ending
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
25 if not(a_file.endswith(last)):
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
26 return None
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
27 if options.new_ending:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
28 name = a_file[:-len(ending)]
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
29 if options.new_ending[0] ==".":
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
30 if name[-1] == ".":
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
31 name = name[:-1]
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
32 return name + options.new_ending
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
33 if options.decompress:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
34 if a_file.endswith(".gz"):
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
35 return a_file[:-3]
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
36 return a_file
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
37
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
38
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
39 def check_and_get_new_name(a_file, options):
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
40 for ending in options.endings:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
41 if a_file.endswith(ending):
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
42 return check_pattern_get_new_name (a_file, ending, options)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
43 return None
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
44
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
45
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
46 def link(a_file, new_name, path):
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
47 file_path = os.path.join(os.path.realpath(path), a_file)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
48 sym_path = os.path.join(os.path.realpath("output"), new_name)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
49 #if not(os.path.exists(sym_path)):
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
50 os.link(file_path, sym_path)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
51
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
52
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
53 def decompress(a_file, new_name, path):
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
54 file_path = os.path.join(os.path.realpath(path), a_file)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
55 target_path = os.path.join(os.path.realpath("output"), new_name)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
56 with gzip.open(file_path, 'rb') as f_in, open(target_path, 'wb') as f_out:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
57 shutil.copyfileobj(f_in, f_out)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
58
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
59
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
60 def copy_and_link(path, options):
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
61 os.mkdir("output")
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
62 with open(options.list, 'w') as list_file:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
63 files = os.listdir(path)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
64 files.sort()
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
65 for a_file in files:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
66 new_name = check_and_get_new_name(a_file, options)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
67 if new_name:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
68 list_file.write(new_name)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
69 list_file.write("\n")
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
70 if options.decompress:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
71 if a_file.endswith(".gz"):
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
72 decompress(a_file, new_name,path)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
73 else:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
74 link(a_file, new_name, path)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
75 elif options.link:
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
76 link(a_file, new_name, path)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
77
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
78
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
79 if __name__ == '__main__':
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
80 parser = optparse.OptionParser()
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
81 parser.add_option("--path", action="store", type="string",
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
82 help="Path of directory to check. ")
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
83 parser.add_option("--ending", action="append", type="string", dest="endings",
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
84 help="Ending that can be listed and if requested linked or decompressed. ")
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
85 parser.add_option("--start", action="store", type="string",
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
86 help="String that must be at the start of the file name ")
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
87 parser.add_option("--last", action="store", type="string",
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
88 help="String that must be the last bit of the file name before the endings")
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
89 parser.add_option("--new_ending", action="store", type="string",
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
90 help="New ending to replace any previous ending in list and if required links or decompressions. Note: If not set decompression will auto remove the compressioned part of the ending")
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
91 #parser.add_option("--regex", action="store", type="string",
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
92 # help="Regex pattern the file name (less . ending) must match before the endings")
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
93 parser.add_option("--list", action="store", type="string",
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
94 help="Path to where all files should be listed. ")
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
95 parser.add_option("--link", action="store_true", default=False,
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
96 help="If set will cause links to be added in output directory. ")
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
97 parser.add_option("--decompress", action="store_true", default=False,
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
98 help="If set will cause gz files to be decompressed or if not a supported decompression ending linked.")
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
99 (options, args) = parser.parse_args()
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
100
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
101
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
102 path = options.path.strip()
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
103 if path[-1] != '/':
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
104 path = path + "/"
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
105 copy_and_link(path, options)
25b07ce180d4 Uploaded first version
brenninc
parents:
diff changeset
106