Fixing UTF-8 encoding errors in files
Aus Wiki
Version vom 23. Oktober 2023, 06:38 Uhr von 129.187.36.61 (Diskussion) (Die Seite wurde neu angelegt: „ # -*- coding: utf-8 -*- import os import sys from chardet import detect def get_encoding_type(file): with open(file, 'rb') as f: rawdata = f.read()…“)
# -*- coding: utf-8 -*-
import os
import sys
from chardet import detect
def get_encoding_type(file):
    """Guess the character encoding of a file from its raw bytes.

    Args:
        file: Path of the file to inspect.

    Returns:
        The ``'encoding'`` entry of chardet's detection result for the
        complete contents of the file.
        NOTE(review): chardet documents that this entry can be ``None``
        when no encoding could be determined -- callers should check.
    """
    # Binary mode: the detector needs the undecoded bytes.
    with open(file, 'rb') as f:
        rawdata = f.read()
    return detect(rawdata)['encoding']
# Re-encode every regular file in the current directory as UTF-8, in place.
files = sorted(os.listdir('.'))
for filename in files:
    # os.listdir also returns directories, which cannot be opened as files.
    if not os.path.isfile(filename):
        continue
    print(filename)
    # Detect once per file: detection reads the whole file, so the result is
    # reused for both the report and the decode below.
    source_encoding = get_encoding_type(filename)
    print(source_encoding)
    if source_encoding is None:
        # Nothing was detected; passing encoding=None to open() would silently
        # fall back to the platform default, so leave the file untouched.
        continue
    try:
        # newline='' turns off newline translation so the file's original
        # line endings are carried through the conversion unchanged.
        with open(filename, 'r', encoding=source_encoding, newline='') as source:
            data = source.read()
    except (UnicodeDecodeError, LookupError) as err:
        # Wrong guess or a codec name Python does not know: the file has not
        # been opened for writing yet, so it is still intact. Report and go on.
        print('skipped:', err)
        continue
    with open(filename, 'w', encoding='utf-8', newline='') as target:
        target.write(data)