summary | refs | log | tree | commit | diff | stats
path: root/util
diff options
context:
space:
mode:
author: Richard Levitte <levitte@openssl.org> 2015-07-13 16:50:16 +0200
committer: Richard Levitte <levitte@openssl.org> 2015-07-14 01:10:01 +0200
commit: f608b4064d58ca4dfdfdfc921308b51cb96205e2 (patch)
tree: 310a006f58c74c77288a85fff996ff753ae48694 /util
parent: eeb97bce751296b2e04a92d00c0d0a792ba61834 (diff)
Small script to re-encode files that need it to UTF-8
This requires 'iconv' and that 'file' can take the options '-b' and '-i'.

Reviewed-by: Rich Salz <rsalz@openssl.org>
Diffstat (limited to 'util')
-rw-r--r-- util/toutf8.sh | 17
1 files changed, 17 insertions, 0 deletions
diff --git a/util/toutf8.sh b/util/toutf8.sh
new file mode 100644
index 0000000000..8a4254b3df
--- /dev/null
+++ b/util/toutf8.sh
@@ -0,0 +1,17 @@
#! /bin/sh
#
# Very simple script to detect and convert files that we want to re-encode
# to UTF-8.
#
# Usage:    toutf8.sh            (no arguments; run inside a git work tree)
# Requires: git, sed, cmp, iconv, and a file(1) that accepts -b and -i.
#
# Every path listed by "git ls-tree -r HEAD" is probed with file(1).  When
# the reported charset is anything other than utf-8, us-ascii or binary, the
# file is converted from ISO-8859-1 to UTF-8.  For each file whose bytes
# actually change:
#   - its path is printed on stdout,
#   - the original is kept as "<path>.iso-8859-1",
#   - "<path>" is replaced by the UTF-8 version.
#
# NOTE(review): the source encoding is always taken to be ISO-8859-1, no
# matter which charset file(1) reported -- confirm this is what is wanted
# for inputs such as UTF-16.

# needs_reencoding CHARSET
#   Returns 0 when CHARSET (as printed by "file -bi") is not one of the
#   encodings that are left untouched, 1 otherwise.
needs_reencoding() {
  case "$1" in
    utf-8 | binary | us-ascii) return 1 ;;
    *) return 0 ;;
  esac
}

# reencode_file PATH
#   Converts PATH from ISO-8859-1 to UTF-8 through the scratch file
#   "PATH.utf8".  Returns non-zero if the conversion or either rename fails.
reencode_file() {
  if ! iconv -f ISO-8859-1 -t UTF-8 < "$1" > "$1.utf8"; then
    # Do not leave a partial scratch file behind after a failed conversion.
    rm -f -- "$1.utf8"
    return 1
  fi

  if cmp -s -- "$1" "$1.utf8"; then
    # Conversion was a no-op: keep the original and drop the scratch file.
    rm -f -- "$1.utf8"
    return 0
  fi

  printf '%s\n' "$1"
  # Only install the new content once the backup rename has succeeded, so a
  # failed backup can never cost us the original bytes.
  mv -- "$1" "$1.iso-8859-1" && mv -- "$1.utf8" "$1"
}

# core.quotePath=false stops git from C-quoting non-ASCII path names;
# "IFS= read -r" keeps backslashes and surrounding blanks in names intact.
git -c core.quotePath=false ls-tree -r --name-only HEAD |
  while IFS= read -r F; do
    # "file -bi" prints e.g. "text/plain; charset=iso-8859-1"; keep only
    # the part after "charset=".
    charset=$(file -bi -- "$F" | sed -e 's|.*charset=||')
    if needs_reencoding "$charset"; then
      reencode_file "$F"
    fi
  done