Last active
October 18, 2016 08:53
-
-
Save xerz-one/c681befd02a2afe8fe60ebebac234a7b to your computer and use it in GitHub Desktop.
A script that destroys Windows-1252 garbage - with garbage!
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
/* | |
Ungarbage v0.1.0.1 | |
October 18th 2016, @espectalll | |
To the extent possible under law, the author has dedicated all copyright and related and neighboring rights | |
to this software to the public domain worldwide. This software is distributed without any warranty. | |
You should have received a copy of the CC0 Public Domain Dedication along with this software. If not, see | |
<http://creativecommons.org/publicdomain/zero/1.0/>. | |
*/ | |
import java.io.File | |
import java.nio.charset.Charset | |
import java.nio.file.Files | |
fun findFiles(dir: File): MutableList<File> { | |
var files: MutableList<File> = arrayListOf() | |
for(child in dir.listFiles()) { | |
var childPath = child.toString() | |
when { | |
child.isDirectory -> files.addAll(findFiles(child)) | |
childPath.endsWith(".html") || childPath.endsWith(".htm") -> files.add(child) | |
} | |
} | |
return files | |
} | |
fun replaceBad(data: List<String>): List<String> { | |
var data = data.toMutableList() | |
var blacklist = mapOf('á' to "á", 'é' to "é", 'í' to "í", 'ó' to "ó", 'ú' to "ú", | |
'Á' to "Á", 'É' to "É", 'Í' to "Í", 'Ó' to "Ó", 'Ú' to "Ú", | |
'ñ' to "ñ", 'Ñ' to "Ñ") | |
for (i in 0..data.size - 1) { | |
for (char in data[i]) { | |
if (blacklist[char] != null) { | |
data[i] = data[i].replace(char.toString(), blacklist[char].toString()) | |
} | |
} | |
} | |
return data | |
} | |
fun main(args: Array<String>) { | |
var files = findFiles(File(".")) | |
for (file in files) { | |
var data = file.readLines(Charset.forName("windows-1252")) | |
Files.write(file.toPath(), replaceBad(data), Charsets.UTF_8) | |
} | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment