#!/bin/bash

# Usage: <script> [lang]
# "lang" names the language sub-directory to process; it defaults to "en".
if [[ "$1" == "--help" ]]; then
  echo "Usage: $0 lang"
  exit 0
fi

language=${1:-en}

# Absolute directory containing this script; it is used further down to
# locate merge_xml.awk. Resolving it with cd/pwd works for both relative and
# absolute invocations, whereas prefixing $(pwd) to an absolute $0 would
# yield a non-existent path. CDPATH is cleared so cd cannot print anything.
basedir=$(CDPATH= cd -- "$(dirname -- "$0")" && pwd) || exit 1
TARGET="./integrated"

cd "./$language" || exit 1

# Private scratch directory. mktemp picks an unpredictable name and creates
# the directory atomically, so another user cannot pre-create it in /tmp.
TEMPDIR=$(mktemp -d /tmp/merge_xml.XXXXXX) || exit 1
# Remove the scratch directory on every exit path, including early aborts.
trap 'rm -rf -- "$TEMPDIR"' EXIT
LOG="$TEMPDIR/merge_xml.$language.log"

#######################################
# Print one "name:path" line for every <!ENTITY ...> declaration in a file.
# A declaration such as
#   <!ENTITY bookinfo.xml SYSTEM "en/bookinfo.xml">
# yields "bookinfo.xml:bookinfo.xml" (the leading "en/" of the path is
# dropped). Lines without "<!ENTITY" are ignored.
# Arguments: $1 - file containing the entity declarations
# Outputs:   the name:path list on stdout
#######################################
extract_entities() {
  # One sed pass instead of a shell loop forking several processes per line:
  #   h        keep a copy of the raw line in the hold space
  #   s,s      reduce the pattern space to the entity name
  #   x        swap: raw line back in pattern space, name in hold space
  #   s,s      reduce the pattern space to the path
  #   x,G      name in pattern space, path appended after a newline
  #   s/\n/:/  join both halves with a colon
  sed -n '/<!ENTITY/{
h
s/.*ENTITY *//
s/ *SYSTEM.*$//
x
s/.*SYSTEM *"en\///
s/">//
x
G
s/\n/:/
p
}' "$1"
}

# The redirection truncates any previous list before it is rebuilt.
extract_entities ../build/docstruct.ent >"$TEMPDIR/entlist"

# Make sure that all files are in UTF-8 first
# This is only necessary while we're converting translated files
#
# Every *.xml file below the current directory is placed under $TEMPDIR/in
# with its relative path preserved. A file whose XML declaration carries an
# encoding attribute is converted to UTF-8 with iconv and loses that
# declaration line; any other file is copied unchanged.
echo "Converting .xml files to UTF-8..." >>"$LOG"

# ERE matching an XML declaration with an encoding attribute. The '?' has to
# be escaped: left bare it merely makes '<' optional, so any line containing
# "encoding=" would match and be stripped from the converted output.
REGEXP='<\?xml[^>]*encoding='

# NUL-delimited find output keeps file names containing whitespace intact.
while IFS= read -r -d '' FILE; do
  DNAME=$(dirname -- "$FILE")
  FNAME=$(basename -- "$FILE")
  mkdir -p -- "$TEMPDIR/in/$DNAME"
  if grep -Eq -- "$REGEXP" "$FILE"; then
    echo "Encoded : $FILE" >>"$LOG"
    # Take the encoding name from the first declaration only, accepting
    # either quote style and tolerating whitespace before the closing "?>".
    ENC=$(grep -E -- "$REGEXP" "$FILE" | head -n 1 \
      | sed "s/.*encoding=[\"']\([^\"']*\)[\"'].*/\1/")
    iconv -f "$ENC" -t utf-8 "$FILE" \
      | grep -Ev -- "$REGEXP" >"$TEMPDIR/in/$DNAME/$FNAME"
  else
    echo "Not encoded: $FILE" >>"$LOG"
    cp -- "$FILE" "$TEMPDIR/in/$DNAME/$FNAME"
  fi
done < <(find . -name "*.xml" -print0)
echo "" >>"$LOG"

# Include lower level xml-files for all the main level xml-files
#
# merge_xml.awk (taken from the script's own directory) is run over the
# language's main install file. It receives the scratch directory as TARGET,
# the log file as LOG and the entity list as ENTLIST. All paths are quoted so
# that directories containing whitespace do not split into extra arguments.
echo "Merging .xml files per 'chapter'..." >>"$LOG"
awk -v TARGET="$TEMPDIR" -v LOG="$LOG" -v ENTLIST="$TEMPDIR/entlist" \
  -f "$basedir/merge_xml.awk" "../build/install.${language}.xml"

# Copy the results to their proper location
cd .. || exit 1
# Derive the destination from TARGET so both always name the same directory.
TDIR="$TARGET/$language"
if [[ -d "$TDIR" ]]; then
  # Drop the output of a previous run. -f keeps a directory that holds no
  # .xml files from producing an error.
  rm -f -- "$TDIR"/*.xml
else
  mkdir -p -- "$TDIR"
fi
cp -- "$TEMPDIR"/*.xml "$TDIR"/
cp -- "$LOG" "$TDIR"/

# ${TEMPDIR:?} aborts instead of expanding to nothing should the variable
# ever be empty, so the recursive removal can never hit an unintended path.
rm -rf -- "${TEMPDIR:?}"
exit 0