12345678910111213141516171819202122232425262728293031323334353637383940 |
- import os, chardet, codecs, argparse
- def WriteFile(filePath, u, encoding="utf-8"):
- with codecs.open(filePath, "w", encoding) as f:
- f.write(u)
- def GBK_2_UTF8(src, dst):
- # 检测编码,coding可能检测不到编码,有异常
- f = open(src, "rb")
- coding = chardet.detect(f.read())["encoding"]
- f.close()
- if coding != "utf-8":
- with codecs.open(src, "r", coding) as f:
- try:
- WriteFile(dst, f.read(), encoding="utf-8")
- try:
- print(src + " " + coding + " to utf-8 converted!")
- except Exception:
- print("print error")
- except Exception:
- print(src +" "+ coding+ " read error")
- # 把目录中的文件编码由gbk转换为utf-8
- def ReadDirectoryFile(rootdir):
- for parent, dirnames, filenames in os.walk(rootdir):
- for dirname in dirnames:
- #递归函数,遍历所有子文件夹
- ReadDirectoryFile(dirname)
- for filename in filenames:
- if filename.endswith(".c") or filename.endswith(".cpp") or filename.endswith(".bas"):
- GBK_2_UTF8(os.path.join(parent, filename),
- os.path.join(parent, filename))
- if __name__ == "__main__":
- parser = argparse.ArgumentParser(description="从指定目录读取文件")
- parser.add_argument("src_path", help="源目录的路径")
- args = parser.parse_args()
- ReadDirectoryFile(args.src_path)
|