webwml/wml2po.sh

261 lines
7.9 KiB
Bash
Raw Normal View History

2009-08-16 08:11:41 +00:00
#!/bin/bash
#
# Author: Runa Sandvik, <runa.sandvik@gmail.com>
# Google Summer of Code 2009
#
# This is Free Software (GPLv3)
# http://www.gnu.org/licenses/gpl-3.0.txt
#
# This script will convert all of the english wml files to po files, and
# keep them updated. The script will also convert subdirectories that
# exist in the english website module.
2009-08-16 08:11:41 +00:00
#
# For more information, see the HOWTO and README in
# translation/tools/gsoc09.
#
### start config ###
# Location of the wml files
wmldir="$PWD"
# Location of the po files.
2009-08-16 08:11:41 +00:00
# Assuming that the translation directory is relative to the website
podir="`dirname $wmldir`/translation/projects/website"
2009-08-16 08:11:41 +00:00
# Set the copyright holder of the po files,
2009-08-16 08:11:41 +00:00
# for example "The Tor Project, Inc"
copyright="The Tor Project, Inc"
# A lot of the wml files have custom tags. These tags have been defined
# in website/include/versions.wmi. Tags that people usually forget to close,
# as well as tags that are not defined in versions.wmi have been added.
# See: https://svn.torproject.org/svn/website/trunk/include/versions.wmi
customtag=`echo $(cat "$wmldir/include/versions.wmi" | awk '{ printf "<%s> " , $2 }' | sed 's/<>//g') "<svnsandbox> <svnwebsite> <svnprojects> <input> <hr> <br> <img> <gitblob> <version-android-components> <package-androidbundle-alpha> <package-androidbundle-alpha-sig> <version-androidbundle-tor>"`
2009-08-16 08:11:41 +00:00
# We also need to use the nodefault option of po4a; space separated list
# of tags that the module should not try to set by default in any
# category. For now, we only need the input tag.
nodefault='<input>'
# The script can write the name of unprocessed files to a log.
# If you want to enable this option, set the logfile here.
2010-08-09 20:39:40 +00:00
logfile="/home/runa/tor/wml2po.log"
2009-08-16 08:11:41 +00:00
# This is the temp logfile. Leave this line even if you don't want to
# log. This will be deleted when the script is done.
tmplog="`dirname $wmldir`/tmp.log"
### end config ###
# Create a lockfile to make sure that only one instance of the script
# can run at any time.
LOCKFILE=wml2po.lock
if lockfile -! -l 60 -r 3 "$LOCKFILE";
then
echo "unable to acquire lock" >2
exit 1
fi
trap "rm -f '$PWD/$LOCKFILE'" exit
# Check if translation/projects/website exist, i.e. has been checked out
if [ ! -d $podir ]
then
echo "Have you remembered to check out translation/projects/website?"
exit 1
fi
# If the logfile is set, write the date.
if [ $logfile ]
then
echo `date` > $logfile
fi
# Create the temp log
touch $tmplog
# We need to find out which language directories we have.
# We also need to excluse the website module directory itself, as well
# as .svn
langdir=`find "$podir" -maxdepth 1 -type d ! -path "$podir" ! -path "$podir/templates" ! -path "*\.*" | sed "s#$podir/##"`
2009-08-16 08:11:41 +00:00
# We only need the english wml files, but we do not wish to translate
# the eff documents.
wml=`find $wmldir -regex '^'$wmldir'/.*en/.*\.wml' -type f | grep -v '^'$wmldir'/eff'`
# For every language directory, create and/or update the po files.
for lang in $langdir ; do
2009-08-16 08:11:41 +00:00
# For every english wml, see if the po needs to be created or
# updated
for file in $wml ; do
2009-08-16 08:11:41 +00:00
# Get the basename of the file we are dealing with
wmlfile=`basename $file`
2009-08-16 08:11:41 +00:00
# Get the translation priority
priority=`cat $file | grep "# Translation-Priority" | awk '{print $3}'`
2009-08-16 08:11:41 +00:00
# If the file doesn't have a translation-priority, we can assume
# that it doesn't need to be translated. Skip this file and
# continue on with the next.
if [ ! $priority ]
then
continue
fi
# Strip the file for its original extension and add .po
pofile="$priority.${wmlfile%%.*}.po"
2009-08-16 08:11:41 +00:00
# Find out what directory the file is in.
# Also, remove the parth of the path that is $wmldir
indir=`dirname $file`
2009-08-16 08:11:41 +00:00
# We need to know what one dir up is
onedirup=`dirname $indir | sed "s#$wmldir/##"`
# We need to have the correct, full path to the po
# directory for the file we are working on.
# Also, did the subdirectory exist prior to running this
# script? If not, create it now and add it to the
# repository.
if [ $onedirup = $wmldir ]
then
popath="$podir/$lang"
else
# We need to know if a subdirectory, such as torbutton,
# exist in the translation module. If it does not exist,
# the script will create it in all the directories under
# translation/projects/website (excluding .svn)
subdir=`find "$podir/$lang" -maxdepth 1 -type d ! -path "$ppodir/$lang" ! -path "*\.*"`
for dir in $subdir ; do
if [ ! -d "$podir/$lang/$onedirup" ]
then
svn mkdir "$podir/$lang/$onedirup"
fi
done
# Set the path
popath="$podir/$lang/$onedirup"
fi
2009-08-16 08:11:41 +00:00
# Check to see if the po existed prior to running this
# script. If it didn't, check if there any files with the same
# filename, but different priority. If neither of the files
# exist, create with po4a-gettextize.
if [ -e "$popath/$pofile" ]
then
poexist=1
elif [ `find $popath -type f -name "*.$filename" | wc -l` -gt "0" ]
then
poexist=2
2009-08-16 08:11:41 +00:00
# We need to rename the other file
for file in `find $popath -type f -name "*.$filename"` ; do
svn mv "$file" "$popath/$pofile"
echo "$popath/$pofile" > $tmplog
done
else
poexist=0
fi
# If the po file does not exist, convert it with
# po4a-gettextize, set the right encoding and charset
# and the correct copyright.
if [ $poexist = 0 ]
2009-08-16 08:11:41 +00:00
then
# Convert it
po4a-gettextize -f wml -m "$file" -p "$popath/$pofile" --master-charset utf-8 -o customtag="$customtag" -o nodefault="$nodefault"
2009-08-16 08:11:41 +00:00
# Check to see if the file exists
if [ -e "$popath/$pofile" ]
2009-08-16 08:11:41 +00:00
then
# We don't want files without
# content, so check the file first.
content=`cat "$popath/$pofile" | grep '^#[.]' | wc -l`
# If the file does not have any
# content, delete it.
if [ $content = 0 ]
then
rm -f "$popath/$pofile"
echo "$popath/$pofile" > $tmplog
else
# Set the right encoding and charset, as well
# as the correct copyright holder.
sed -i '0,/ENCODING/ s/ENCODING/8bit/' "$popath/$pofile"
sed -i '0,/CHARSET/ s/CHARSET/utf-8/' "$popath/$pofile"
sed -i "0,/Free Software Foundation, Inc/ s/Free Software Foundation, Inc/$copyright/" "$popath/$pofile"
# And add it to the repository
svn add "$popath/$pofile"
echo "$popath/$pofile" > $tmplog
fi
fi
# Update the file with po4a-updatepo to make the
# word wrapping perfect
po4a-updatepo -f wml -m "$file" -p "$popath/$pofile" --master-charset utf-8 -o customtag="$customtag" -o nodefault="$nodefault"
# Delete the backup
rm -f "$popath/$pofile~"
fi
# If the po file does exist, calculate the hash first,
# then update the file, then calculate the hash again.
if [ $poexist = 1 ]
then
# Calculate the hash before we update the file
before=`grep -vE '^("POT-Creation-Date:|#)' "$popath/$pofile" | md5sum | cut -d " " -f1`
# Update the po file
po4a-updatepo -f wml -m "$file" -p "$popath/$pofile" --master-charset utf-8 -o customtag="$customtag" -o nodefault="$nodefault"
# Calculate the new hash
after=`grep -vE '^("POT-Creation-Date:|#)' "$popath/$pofile" | md5sum | cut -d " " -f1`
# Delete the backup
rm -f "$popath/$pofile~"
# Now we need to compare the before and after
# hash. If they match (i.e. nothing has
# changed), revert the file.
if [ $before = $after ]
then
svn revert "$popath/$pofile"
2009-08-16 08:11:41 +00:00
echo "$popath/$pofile" > $tmplog
else
echo "$popath/$pofile" > $tmplog
fi
fi
# If a file with the same name but different priority
# exist, then rename the file (we have done so already)
# and update it with po4a-updatepo to make sure
# everything else is ok.
if [ $poexist = 2 ]
2009-08-16 08:11:41 +00:00
then
# Update the file
po4a-updatepo -f wml -m "$file" -p "$popath/$pofile" --master-charset utf-8 -o customtag="$customtag" -o nodefault="$nodefault"
2009-08-16 08:11:41 +00:00
fi
# Write to the logfile
if [ -e $logfile ]
2009-08-16 08:11:41 +00:00
then
if [ `cat $tmplog | grep "$popath/$pofile" | wc -l` -eq "0" ]
then
echo "could not process: " "$file" >> $logfile
fi
2009-08-16 08:11:41 +00:00
fi
# Delete the temp log
rm -f $tmplog
done
2009-08-16 08:11:41 +00:00
done