UTF-8 encoding errors of files

Aus Wiki
Version vom 23. Oktober 2023, 06:38 Uhr von 129.187.36.61 (Diskussion) (Die Seite wurde neu angelegt: „ # -*- coding: utf-8 -*- import os import sys from chardet import detect def get_encoding_type(file): with open(file, 'rb') as f: rawdata = f.read()…“)
(Unterschied) ← Nächstältere Version | Aktuelle Version (Unterschied) | Nächstjüngere Version → (Unterschied)
Wechseln zu: Navigation, Suche
# -*- coding: utf-8 -*-
import os
import sys
from chardet import detect

def get_encoding_type(file):
	"""Guess the character encoding of a file from its raw bytes.

	The complete file is read in binary mode and handed to chardet's
	``detect``.

	Args:
		file: Path of the file to inspect.

	Returns:
		The value stored under the ``'encoding'`` key of the detection
		result.
	"""
	with open(file, 'rb') as handle:
		guess = detect(handle.read())
	return guess['encoding']

# Re-encode every regular file in the current working directory to UTF-8,
# in place. For each file the name and the detected encoding are printed.
files = sorted(os.listdir('.'))
for filename in files:
	# os.listdir() also returns sub-directories, which cannot be opened
	# as files; skip anything that is not a regular file.
	if not os.path.isfile(filename):
		continue

	print(filename)
	# Detect once and reuse the result instead of reading and analysing
	# the file a second time.
	encoding = get_encoding_type(filename)
	print(encoding)

	if encoding is None:
		# No usable guess. Passing encoding=None to open() would silently
		# decode with the locale default, so leave the file untouched.
		continue

	try:
		# newline='' disables newline translation so that re-encoding
		# does not change the file's line endings.
		with open(filename, 'r', encoding=encoding, newline='') as source:
			data = source.read()
	except (LookupError, UnicodeDecodeError) as err:
		# LookupError: Python has no codec with the detected name.
		# UnicodeDecodeError: the guess does not match the actual bytes.
		# Nothing has been written yet, so the file is still intact.
		print('skipping {}: {}'.format(filename, err), file=sys.stderr)
		continue

	# The file is only rewritten after it has been decoded successfully.
	with open(filename, 'w', encoding='utf-8', newline='') as target:
		target.write(data)