Last active
August 24, 2019 13:02
-
-
Save jhandley/242f46c6c096fb18a4d375d46c0c9ee3 to your computer and use it in GitHub Desktop.
Change character encodings of a bunch of C++ source files
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/python | |
import sys, os, chardet | |
def main(argv): | |
if len(argv) < 3: | |
print("Usage: " + argv[0] + " <directory> encoding") | |
sys.exit(2) | |
root_dir = argv[1] | |
target_encoding = argv[2] | |
for root, dirnames, filenames in os.walk(root_dir): | |
for filename in filenames: | |
if filename.endswith(('.h', '.cpp', '.c', '.cc')): | |
source_file = os.path.join(root, filename) | |
source_encoding = chardet.detect(open(source_file, 'rb').read())['encoding'] | |
if source_encoding != target_encoding and source_encoding != 'ascii': | |
print("Convert ", source_file, " from ", source_encoding) | |
with open(source_file, 'r', encoding=source_encoding) as f: | |
try: | |
lines = f.readlines() | |
except: | |
print("ERROR reading file ", source_file, source_encoding) | |
raise | |
with open(source_file, 'w', encoding=target_encoding) as f: | |
try: | |
for line in lines: | |
f.write(line) | |
except: | |
print("ERROR writing file ", source_file, source_encoding) | |
raise | |
if __name__ == "__main__": | |
main(sys.argv) |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment