使用python批量查看文件编码,或者批量修改文件编码
代码
#!/usr/bin/python
import os
import chardet
# 获得所有txt(根据个人需求更改)文件的路径,传入根目录路径
def find_all_file(path: str) -> str:
for root, dirs, files in os.walk(path):
for f in files:
if f.endswith('.txt'):#根据个人需求更改
fullname = os.path.join(root, f)
yield fullname
pass
pass
pass
# 判断是不是utf-8编码方式
def judge_coding(path: str) -> dict:
with open(path, 'rb') as f:
c = chardet.detect(f.read())
if c['encoding'] != 'utf-8':
return c
# 修改文件编码方式
def change_to_utf_file(path: str):
for i in find_all_file(path):
c = judge_coding(i)
if c:
change(i, c['encoding'])
print("{} 编码方式已从{}改为 utf-8".format(i, c['encoding']))
# 执行修改操作
def change(path: str, coding: str):
with open(path, 'r', encoding=coding) as f:
text = f.read()
with open(path, 'w', encoding='utf-8') as f:
f.write(text)
# 查看所有文件编码方式
def check(path: str):
for i in find_all_file(path):
with open(i, 'rb') as f:
print(chardet.detect(f.read())['encoding'], ': ', i)
def main():
my_path = 'D:/Project/python/Chardet/test'
#根据需求打开相应注释
#change_to_utf_file(my_path)#修改文件编码,修改的时候打开注释
#check(my_path)#查看文件编码,查看的时候打开注释
if __name__ == '__main__':
main()
结果
查看文件编码
image.png
执行编码转换
image.png
再次查看转换后的编码
image.png










网友评论