import os
# Default directory that receives the UTF-8 re-encoded copies.
output_path: str = r'./data_erji_utf8'
def gbk_to_utf8(path, output_dir=None):
    """Re-encode every GBK file directly inside ``path`` as UTF-8.

    Only regular files directly in ``path`` are converted; sub-directories
    are printed but otherwise skipped (no recursion). Each converted file is
    written under the same file name into the destination directory.

    :param path: directory containing the GBK-encoded source files
    :param output_dir: directory for the UTF-8 copies; when ``None`` the
        module-level ``output_path`` is used
    :return: None
    :raises UnicodeDecodeError: if a file's bytes are not valid GBK
    :raises OSError: if ``path`` cannot be listed or a file cannot be
        read or written
    """
    if output_dir is None:
        # Looked up at call time so the module-level default stays the
        # single source of truth for callers that pass only ``path``.
        output_dir = output_path

    # Without this the first write fails with FileNotFoundError whenever the
    # destination directory has not been created by hand beforehand.
    os.makedirs(output_dir, exist_ok=True)

    for file_name in os.listdir(path):
        file_path = os.path.join(path, file_name)
        print(file_path)

        # Directories and other non-regular entries are not converted.
        if not os.path.isfile(file_path):
            continue

        # Read raw bytes so the decoding step is explicit and under our control.
        with open(file_path, 'rb') as src:
            gbk_content = src.read()

        utf8_content = gbk_content.decode('gbk').encode('utf-8')

        with open(os.path.join(output_dir, file_name), 'wb') as dst:
            dst.write(utf8_content)
if __name__ == '__main__':
    # Script entry point: convert the GBK files found in ./data_erji.
    gbk_to_utf8('./data_erji')
# (No comments yet.)