2019-07-11 05:53:40 +02:00
|
|
|
#!/bin/sh
|
|
|
|
|
|
|
|
# This script allows you to compare two epub, odt, or docx
|
|
|
|
# containers, ignoring insignificant formatting differences
|
|
|
|
# in the XML contents.
|
|
|
|
|
2019-07-17 18:21:41 +02:00
|
|
|
UNAME=$(uname)
|
|
|
|
if [ "$UNAME" = "Darwin" ]; then
|
|
|
|
FIND="find -E"
|
|
|
|
else
|
|
|
|
FIND="find -regextype posix-extended"
|
|
|
|
fi
|
|
|
|
|
2019-07-11 05:53:40 +02:00
|
|
|
f1="$1"
|
|
|
|
f2="$2"
|
|
|
|
test -f "$f1" -a -f "$f2" || {
|
|
|
|
echo "Usage: diff-zip firstfile secondfile" && exit 1
|
|
|
|
}
|
2019-07-12 18:08:27 +02:00
|
|
|
WORKDIR=$(mktemp -d -t diff-zip.XXX)
|
2019-07-11 05:53:40 +02:00
|
|
|
trap "{ rm -r $WORKDIR; }" EXIT
|
|
|
|
unzip -q -d "$WORKDIR/a" "$f1"
|
|
|
|
unzip -q -d "$WORKDIR/b" "$f2"
|
|
|
|
cd "$WORKDIR"
|
|
|
|
mkdir tidy
|
|
|
|
for x in a b; do
|
|
|
|
cp -r $x tidy/
|
2019-07-17 18:21:41 +02:00
|
|
|
$FIND $x -iregex '.*\.(xhtml|xml|rdf|rels)' -exec sh -c 'mkdir -p "$(dirname tidy/$1)" && tidy -q -xml -utf8 -i "$1" > "tidy/$1"' _ {} \;
|
2019-07-11 05:53:40 +02:00
|
|
|
done
|
|
|
|
cd tidy
|
|
|
|
mkdir c
|
|
|
|
cp -r a/* c/
|
|
|
|
cp -r b/* c/
|
2019-07-12 18:08:27 +02:00
|
|
|
find c -type f -exec sh -c 'echo -e "\033[1m=== ${1#*/} ===\033[0m" ; diff -u "a/${1#*/}" "b/${1#*/}" 2>&1' _ {} \;
|