UTF-8 encoding errors in files

Aus Wiki
Wechseln zu: Navigation, Suche
# -*- coding: utf-8 -*-
import os
import sys
from chardet import detect

def get_encoding_type(file):
    """Return the encoding that chardet's ``detect`` reports for *file*.

    The file is opened in binary mode and read in full; the raw bytes are
    passed to ``detect`` and the ``'encoding'`` entry of its result is
    returned unchanged.
    """
    with open(file, 'rb') as stream:
        content = stream.read()
    detection = detect(content)
    return detection['encoding']

# Re-encode every regular file in the current directory to UTF-8, in place.
files = sorted(os.listdir('.'))
for filename in files:
    # os.listdir() also returns sub-directories; those cannot be opened
    # as files, so leave them alone instead of crashing on them.
    if not os.path.isfile(filename):
        continue

    print(filename)
    # Detect once and reuse the result: detection reads the whole file.
    encoding = get_encoding_type(filename)
    print(encoding)

    # With no detected encoding, open() would fall back to the platform
    # default and the rewrite could corrupt the file, so skip it.
    if encoding is None:
        continue

    try:
        # newline='' turns off newline translation so that only the
        # encoding changes and the original line endings are kept.
        with open(filename, 'r', encoding=encoding, newline='') as source:
            data = source.read()
    except (UnicodeDecodeError, LookupError) as err:
        # The guess was wrong (bytes do not decode) or names a codec this
        # Python does not provide. The file has not been touched yet, so
        # report it and carry on with the remaining files.
        print('skipped {}: {}'.format(filename, err), file=sys.stderr)
        continue

    # The content is fully in memory, so truncating the file is safe here.
    with open(filename, 'w', encoding='utf-8', newline='') as target:
        target.write(data)