From 1b2c8eb3b653ecc05e332be16a79e740cd679a9f Mon Sep 17 00:00:00 2001 From: Aaron LI Date: Tue, 27 Aug 2019 15:54:43 +0800 Subject: cli/unzip-gbk: Rewrite in shell and use bsdtar/7z * Rewrite in shell instead of using the deprecated Python 2. * Use bsdtar/7z to extract zip to preserve the filename encoding; these tools also support encrypted zip archives. * Use iconv to convert the filename encoding. --- cli/unzip-gbk.sh | 55 +++++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 55 insertions(+) create mode 100755 cli/unzip-gbk.sh (limited to 'cli/unzip-gbk.sh') diff --git a/cli/unzip-gbk.sh b/cli/unzip-gbk.sh new file mode 100755 index 0000000..53c7b57 --- /dev/null +++ b/cli/unzip-gbk.sh @@ -0,0 +1,55 @@ +#!/bin/sh +# +# Extract a zip archive and fix Chinese filenames. +# +# Credit: https://superuser.com/a/872616 +# + +has() { + type "$1" >/dev/null 2>&1 +} + +extract() { + if has bsdtar; then + # bsdtar provided by libarchive + bsdtar -xvf "$1" + elif has 7z; then + # 7z provided by p7zip + env LC_ALL=C 7z x "$1" + else + echo "ERROR: Neither bsdtar nor 7z found" >&2 + exit 1 + fi +} + +fixnames() { + find . -depth | while read -r p; do + dn=$(dirname "${p}") + fn=$(basename "${p}") + fn2=$(echo "${fn}" | iconv -f gbk -t utf-8) + if [ "${fn}" != "${fn2}" ]; then + mv -v "${dn}/${fn}" "${dn}/${fn2}" + fi + done +} + +case $1 in +'' | -h | --help) + echo "usage: ${0##*/} " + exit 1 + ;; +esac + +zipfile=$(realpath "$1") +curdir=$(pwd) +tmpdir=$(mktemp -d) +cd "${tmpdir}" + +echo "Extracting archive '${zipfile}' ..." +extract "${zipfile}" +echo "Fixing filenames ..." +fixnames + +cd "${curdir}" +mv "${tmpdir}"/* . +rmdir "${tmpdir}" -- cgit v1.2.2