#!/usr/bin/env python
"""Print a UTF-8 encoded file to standard output in Unicode NFC form.

Usage: pass exactly one argument, the path of the file to normalize.
The normalized text is written to standard output as UTF-8 bytes with
no newline appended. The script exits with status 1 when the argument
count is wrong.
"""
import sys
import unicodedata


def normalize_nfc_bytes(raw):
    """Return the UTF-8 bytes *raw* re-encoded after NFC normalization.

    Args:
        raw: a byte string holding UTF-8 encoded text.

    Returns:
        The NFC-normalized text, encoded as UTF-8 bytes.

    Raises:
        UnicodeDecodeError: if *raw* is not valid UTF-8.
    """
    text = raw.decode('utf-8')
    return unicodedata.normalize('NFC', text).encode('utf-8')


def read_normalized(filename):
    """Read *filename* and return its contents NFC-normalized as UTF-8 bytes.

    The file is opened in binary mode so the bytes are decoded exactly as
    stored (no newline translation), and the ``with`` block guarantees the
    handle is closed even when reading or decoding fails.
    """
    with open(filename, 'rb') as handle:
        return normalize_nfc_bytes(handle.read())


def main(argv):
    """Run the command-line tool and return the process exit status.

    Args:
        argv: the full argument vector, program name included.

    Returns:
        1 if *argv* does not hold exactly one file name, otherwise 0.
    """
    if len(argv) != 2:
        return 1
    # Python 3 exposes the byte stream as sys.stdout.buffer; on Python 2
    # sys.stdout itself accepts byte strings.
    out = getattr(sys.stdout, 'buffer', sys.stdout)
    out.write(read_normalized(argv[1]))
    return 0


if __name__ == '__main__':
    sys.exit(main(sys.argv))