|
@@ -19,20 +19,19 @@ from difflib import unified_diff
|
|
|
fns = sys.argv[1:]
|
|
|
|
|
|
translate = {
|
|
|
-
|
|
|
- '\r': '',
|
|
|
+ '\r': None,
|
|
|
'\b': '[BS]',
|
|
|
|
|
|
}
|
|
|
|
|
|
def cleanup_file(fn):
|
|
|
|
|
|
- with open(fn) as fp:
|
|
|
- data = fp.read()
|
|
|
+
|
|
|
+ with open(fn,'rb') as fp:
|
|
|
+ data = fp.read().decode()
|
|
|
|
|
|
def gen_text():
|
|
|
- for line in data.splitlines():
|
|
|
-
|
|
|
+ for line in data.split('\n'):
|
|
|
line = line.translate({ord(a):b for a,b in translate.items()})
|
|
|
line = re.sub(r'\s+$','',line)
|
|
|
yield line
|