Files
Upsilon/apps/reader/normalize.py
2020-11-21 19:29:46 +01:00

19 lines
428 B
Python

import argparse
import io
import os
import shutil
import sys
import unicodedata
def normalize_file(path, form="NFKD"):
    """Rewrite the UTF-8 text file at *path* in Unicode-normalized form.

    The file is decoded as UTF-8, each line is passed through
    ``unicodedata.normalize`` and re-encoded as UTF-8 into ``path + ".tmp"``,
    which then replaces the original file.

    Args:
        path: Path of the file to normalize in place.
        form: Normalization form handed to ``unicodedata.normalize``
            (defaults to "NFKD", the form this script has always used).

    Raises:
        IOError / OSError: If the file cannot be read or the temporary file
            cannot be written or moved.
        UnicodeDecodeError: If the file is not valid UTF-8.

    Note:
        The input is read in text mode with universal newlines while the
        output is written as raw bytes, so CRLF/CR line endings come back
        as LF.
    """
    tmp_path = path + ".tmp"
    try:
        # Open the input first so that a missing file does not leave an
        # empty temporary file behind.
        with io.open(path, "r", encoding="utf-8") as source:
            with open(tmp_path, "wb") as output:
                for line in source:
                    normalized = unicodedata.normalize(form, line)
                    output.write(normalized.encode("UTF-8"))
    except Exception:
        # Never leave a half-written temporary file next to the original,
        # and never replace the original with partial output.
        if os.path.exists(tmp_path):
            os.remove(tmp_path)
        raise
    # Only replace the original once the normalized copy is complete.
    shutil.move(tmp_path, path)


def main(argv=None):
    """Command-line entry point: normalize the file named by the first argument.

    Args:
        argv: Argument list without the program name; defaults to
            ``sys.argv[1:]``. Arguments after the first are ignored.

    Returns:
        0 on success, 2 when no file name was supplied.
    """
    args = sys.argv[1:] if argv is None else argv
    if not args:
        sys.stderr.write("usage: normalize.py FILE\n")
        return 2
    filename = args[0]
    print("Normalization of "+filename)
    normalize_file(filename)
    return 0


if __name__ == "__main__":
    sys.exit(main())