UTF-8 encoding errors of files
Aus Wiki
# -*- coding: utf-8 -*-
import os
import sys
from chardet import detect
def get_encoding_type(file):
    """Return the character encoding that chardet detects for *file*.

    The file is opened in binary mode, read completely, and the raw bytes
    are passed to ``detect``.  The ``'encoding'`` entry of the detection
    result is returned unchanged.

    Args:
        file: Path of the file to inspect.

    Returns:
        Whatever ``detect`` stored under ``'encoding'``.
        NOTE(review): chardet presumably reports ``None`` here when it cannot
        determine an encoding -- confirm against the chardet documentation.
    """
    with open(file, 'rb') as handle:
        detection = detect(handle.read())
    return detection['encoding']
# Re-encode every regular file in the current working directory as UTF-8,
# in place.  For each file the name and the detected source encoding are
# printed to stdout; files that cannot be converted are reported on stderr
# and left untouched.
files = sorted(os.listdir('.'))
for filename in files:
    # os.listdir() also returns sub-directories; open() on those would raise
    # and abort the whole run, so only regular files are processed.
    if not os.path.isfile(filename):
        continue

    print(filename)
    # Detect once and reuse the result: detection reads the entire file.
    encoding = get_encoding_type(filename)
    print(encoding)

    if encoding is None:
        # Passing encoding=None to open() would silently fall back to the
        # locale's default encoding and could corrupt the file on rewrite.
        print('skipped', filename, '(encoding could not be detected)',
              file=sys.stderr)
        continue

    try:
        # newline='' disables newline translation so the original line
        # endings survive the round trip; only the encoding changes.
        with open(filename, 'r', encoding=encoding, newline='') as source:
            data = source.read()
    except (LookupError, UnicodeDecodeError) as err:
        # LookupError: the detected name is not a codec Python knows.
        # UnicodeDecodeError: the detection was wrong for this content.
        # The file has not been opened for writing yet, so it is unchanged.
        print('skipped', filename, '(' + str(err) + ')', file=sys.stderr)
        continue

    # The file is only truncated after its content was decoded successfully.
    with open(filename, 'w', encoding='utf-8', newline='') as target:
        target.write(data)