forked from ziyuang/mincemeatpy
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathfileiter.py
47 lines (39 loc) · 1.56 KB
/
fileiter.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
from itertools import islice
import optparse
import os
def read(filename, n=20, encoding=None):
    """Lazily yield the contents of a text file in chunks of ``n`` lines.

    Args:
        filename: Path of the text file to read.
        n: Maximum number of lines joined into each yielded chunk.
        encoding: Text encoding passed to ``open``. ``None`` keeps the
            platform default; pass ``'utf-8'`` if reading raises
            ``UnicodeDecodeError``.

    Yields:
        Strings made of up to ``n`` consecutive lines, line endings
        included. Nothing is yielded for an empty file.

    The file is opened when iteration starts and stays open until the
    generator is exhausted or closed.
    """
    with open(filename, 'r', encoding=encoding) as f:
        while True:
            # islice consumes at most n lines from the shared file iterator,
            # so each pass continues where the previous chunk stopped.
            lines = ''.join(islice(f, n))
            if not lines:
                # An empty chunk means no lines were left to read.
                break
            yield lines
def split_file(dir, filename, n=4):
    """Distribute the chunks of ``filename`` round-robin over ``n`` files.

    The input is consumed through ``read(filename)`` and chunk ``i`` is
    appended to output file ``i % n``. Outputs are written to
    ``<dir>/<base>_split_<n>/<base>_<i>``, where ``<base>`` is the final
    path component of ``filename``.

    Args:
        dir: Destination directory under which the split directory is made.
        filename: Path of the input file.
        n: Number of output files; must be at least 1.

    Returns:
        None. If the split directory already exists, a message is printed
        and nothing is written.

    Raises:
        ValueError: If ``n`` is smaller than 1.
    """
    if n < 1:
        # Reject before touching the filesystem; otherwise the directory is
        # created and the write loop then fails on ``i % n`` / ``files[...]``.
        raise ValueError("number of splits must be at least 1, got %r" % (n,))

    # Use only the base name for output paths: a filename such as
    # "data/in.txt" would otherwise point the outputs into a sub-directory
    # of the split directory that is never created.
    base = os.path.basename(filename)
    dirname = "%s/%s_split_%d" % (dir, base, n)
    try:
        print(dirname)
        os.makedirs(dirname)
    except FileExistsError:
        print("file already processed, please delete the directory before resplit")
        return

    chunks = read(filename)
    files = []
    try:
        for i in range(n):
            files.append(open("%s/%s_%d" % (dirname, base, i), 'w'))
        for i, chunk in enumerate(chunks):
            files[i % n].write(chunk)
    finally:
        # Release every handle even if opening or writing failed part-way.
        for out in files:
            out.close()
        chunks.close()
def splitter_options_parse():
    """Build the command-line option parser for the file splitter.

    Returns:
        An ``optparse.OptionParser`` with the ``-f/--filename``,
        ``-n/--number_of_splits`` and ``-d/--dir`` options. All option
        values, including the number of splits, are kept as strings.
    """
    release = '0.0.1'
    option_table = (
        (('-f', '--filename'),
         {'dest': 'filename', 'default': '', 'help': 'name of input file'}),
        (('-n', '--number_of_splits'),
         {'dest': 'number_of_splits', 'default': '4', 'help': 'number of splits'}),
        (('-d', '--dir'),
         {'dest': 'dirname', 'default': 'windows', 'help': 'destination directory'}),
    )

    cli = optparse.OptionParser(usage='%prog [options]', version='%%prog %s' % release)
    # Register in table order so the generated help lists options as before.
    for flags, settings in option_table:
        cli.add_option(*flags, **settings)
    return cli
if __name__ == '__main__':
    # Script entry point: parse the command line and split the requested
    # file, or ask for a file name when none was supplied.
    options, args = splitter_options_parse().parse_args()
    if options.filename != "":
        # The split count arrives as a string from the parser.
        split_file(options.dirname, options.filename, int(options.number_of_splits))
    else:
        print("please enter file name")