Prusa-Firmware/lang/lang-import.sh
2022-02-22 06:58:37 +01:00

480 lines
16 KiB
Bash
Executable File

#!/bin/bash
#
# Version 1.0.1 Build 36
#
# lang-import.sh - multi-language support script
# for importing translated xx.po
#
#############################################################################
# Change log:
# 9 Nov. 2018, XPila, Initial
# 21 Nov. 2018, XPila, fix - replace '\n' with space in all languages
# 10 Dec. 2018, jhoblitt, make all shell scripts executable
# 21 Aug. 2019, 3d-gussner, Added "All" argument and it is default in nothing is chosen
# Added few German/French diacritical characters
# 6 Sep. 2019, DRracer, change to bash
# 14 Sep. 2019, 3d-gussner, Prepare adding new language
# 1 Mar. 2019, 3d-gussner, Move `Dutch` language parts
# Add templates for future community languages
# 17 Dec. 2021, 3d-gussner, Use one config file for all languages
# Fix missing last translation
# Add counter
# replace two double quotes with `\x00`
# 21 Dec. 2021, 3d-gussner, Add Swedish, Danish, Slovanian, Hungarian,
# Luxembourgish, Croatian
# 3 Jan. 2022, 3d-gussner, Add Lithuanian
# Cleanup outaded code
# 11 Jan. 2022, 3d-gussner, Added version and Change log
# colored output
# Add Community language support
# Use `git rev-list --count HEAD lang-import.sh`
# to get Build Nr
# 14 Jan. 2022, 3d-gussner, Replace German UTF-8 'äöÿÿ' to HD44780 A00 ROM 'äöÿÿ'
# 28 Jan. 2022, 3d-gussner, Run lang-check and output `xx-output.txt` file to review
# translations
# new argruments `--information` `--import-check`
# 11 Jan. 2022, ingbrzy, Add Slovak letters
# 11 Feb. 2022, 3d-gussner, Change to python3
# 14 Feb. 2022, 3d-gussner, Replace non-block space with space
# Fix single language run without config.sh OK
#############################################################################
echo "$(tput setaf 2)lang-import.sh started$(tput sgr 0)" >&2
LNG=$1
# if no arguments, 'all' is selected (all po and also pot will be generated)
if [ -z "$LNG" ]; then
LNG=all;
# Config:
if [ -z "$CONFIG_OK" ]; then eval "$(cat config.sh)"; fi
if [ -z "$CONFIG_OK" ] | [ $CONFIG_OK -eq 0 ]; then echo "$(tput setaf 1)Config NG!$(tput sgr 0)" >&2; exit 1; fi
fi
if [[ ! -z "$COMMUNITY_LANGUAGES" && "$LNG" = "all" ]]; then
LANGUAGES+=" $COMMUNITY_LANGUAGES"
else
LANGUAGES="$LNG"
fi
echo "$(tput setaf 2)lang-import languages:$LANGUAGES$(tput sgr 0)" >&2
# if 'all' is selected, script will generate all po files and also pot file
if [ "$LNG" = "all" ]; then
for lang in $LANGUAGES; do
./lang-import.sh $lang
done
exit 0
fi
# language code (iso639-1) is equal to LNG
LNGISO=$LNG
# exception for 'cz' (code='cs')
if [ "$LNG" = "cz" ]; then LNGISO=cs; fi
# cd to input folder
cd po/new
# check if input file exists
if ! [ -e $LNGISO.po ]; then
echo "$(tput setaf 1)Input file $LNGISO.po not found!$(tput sgr 0)" >&2
exit -1
fi
#convert '\\e' sequencies to 'x1b' and '\\' to '\'
cat $LNGISO.po | sed 's/\\e/\\x1b/g;s/\\\\/\\/g' > $LNG'_filtered.po'
#replace '\n' with ' ' (single space)
sed -i 's/ \\n/ /g;s/\\n/ /g' $LNG'_filtered.po'
#replace in czech translation
if [ "$LNG" = "cz" ]; then
#replace 'Á' with 'A'
sed -i 's/\xc3\x81/A/g' $LNG'_filtered.po'
#replace 'á' with 'a'
sed -i 's/\xc3\xa1/a/g' $LNG'_filtered.po'
#replace 'Č' with 'C'
sed -i 's/\xc4\x8c/C/g' $LNG'_filtered.po'
#replace 'č' with 'c'
sed -i 's/\xc4\x8d/c/g' $LNG'_filtered.po'
#replace 'Ď' with 'D'
sed -i 's/\xc4\x8e/D/g' $LNG'_filtered.po'
#replace 'ď' with 'd'
sed -i 's/\xc4\x8f/d/g' $LNG'_filtered.po'
#replace 'É' with 'E'
sed -i 's/\xc3\x89/E/g' $LNG'_filtered.po'
#replace 'é' with 'e'
sed -i 's/\xc3\xa9/e/g' $LNG'_filtered.po'
#replace 'Ě' with 'E'
sed -i 's/\xc4\x9a/E/g' $LNG'_filtered.po'
#replace 'ě' with 'e'
sed -i 's/\xc4\x9b/e/g' $LNG'_filtered.po'
#replace 'Í' with 'I'
sed -i 's/\xc3\x8d/I/g' $LNG'_filtered.po'
#replace 'í' with 'i'
sed -i 's/\xc3\xad/i/g' $LNG'_filtered.po'
#replace 'Ň' with 'N'
sed -i 's/\xc5\x87/N/g' $LNG'_filtered.po'
#replace 'ň' with 'n'
sed -i 's/\xc5\x88/n/g' $LNG'_filtered.po'
#replace 'Ó' with 'O'
sed -i 's/\xc3\x93/O/g' $LNG'_filtered.po'
#replace 'ó' with 'o'
sed -i 's/\xc3\xb3/o/g' $LNG'_filtered.po'
#replace 'Ř' with 'R'
sed -i 's/\xc5\x98/R/g' $LNG'_filtered.po'
#replace 'ř' with 'r'
sed -i 's/\xc5\x99/r/g' $LNG'_filtered.po'
#replace 'Š' with 'S'
sed -i 's/\xc5\xa0/S/g' $LNG'_filtered.po'
#replace 'š' with 's'
sed -i 's/\xc5\xa1/s/g' $LNG'_filtered.po'
#replace 'Ť' with 'T'
sed -i 's/\xc5\xa4/T/g' $LNG'_filtered.po'
#replace 'ť' with 't'
sed -i 's/\xc5\xa5/t/g' $LNG'_filtered.po'
#replace 'Ú' with 'U'
sed -i 's/\xc3\x9a/U/g' $LNG'_filtered.po'
#replace 'ú' with 'u'
sed -i 's/\xc3\xba/u/g' $LNG'_filtered.po'
#replace 'Ů' with 'U'
sed -i 's/\xc5\xae/U/g' $LNG'_filtered.po'
#replace 'ů' with 'u'
sed -i 's/\xc5\xaf/u/g' $LNG'_filtered.po'
#replace 'Ý' with 'Y'
sed -i 's/\xc3\x9d/Y/g' $LNG'_filtered.po'
#replace 'ý' with 'y'
sed -i 's/\xc3\xbd/y/g' $LNG'_filtered.po'
#replace 'Ž' with 'Z'
sed -i 's/\xc5\xbd/Z/g' $LNG'_filtered.po'
#replace 'ž' with 'z'
sed -i 's/\xc5\xbe/z/g' $LNG'_filtered.po'
fi
#replace in German translation https://en.wikipedia.org/wiki/German_orthography
#replace in Swedish as well
if [[ "$LNG" = "de" || "$LNG" = "sv" ]]; then
#replace UTF-8 'äöüß' to HD44780 A00 'äöüß'
#replace 'ä' with 'A00 ROM ä'
sed -i 's/\xc3\xa4/\\xe1/g' $LNG'_filtered.po'
#replace 'Ä' with 'A00 ROM ä'
sed -i 's/\xc3\x84/\\xe1/g' $LNG'_filtered.po'
#replace 'ü' with 'A00 ROM ü'
sed -i 's/\xc3\xbc/\\xf5/g' $LNG'_filtered.po'
#replace 'Ü' with 'A00 ROM ü'
sed -i 's/\xc3\x9c/\\xf5/g' $LNG'_filtered.po'
#replace 'ö' with 'A00 ROM ö'
sed -i 's/\xc3\xb6/\\xef/g' $LNG'_filtered.po'
#replace 'Ö' with 'A00 ROM ö'
sed -i 's/\xc3\x96/\\xef/g' $LNG'_filtered.po'
#replace 'ß' with 'A00 ROM ß'
sed -i 's/\xc3\x9f/\\xe2/g' $LNG'_filtered.po'
fi
#replace in spain translation
if [ "$LNG" = "es" ]; then
#replace 'á' with 'a'
sed -i 's/\xc3\xa1/a/g' $LNG'_filtered.po'
#replace '¿' with '?'
sed -i 's/\xc2\xbf/?/g' $LNG'_filtered.po'
#replace 'ó' with 'o'
sed -i 's/\xc3\xb3/o/g' $LNG'_filtered.po'
#replace 'é' with 'e'
sed -i 's/\xc3\xa9/e/g' $LNG'_filtered.po'
#replace 'í' with 'i'
sed -i 's/\xc3\xad/i/g' $LNG'_filtered.po'
#replace '!' with '!'
sed -i 's/\xc2\xa1/!/g' $LNG'_filtered.po'
#replace 'n~' with 'n'
sed -i 's/\xc3\xb1/n/g' $LNG'_filtered.po'
fi
#replace in french translation https://en.wikipedia.org/wiki/French_orthography
if [ "$LNG" = "fr" ]; then
#replace 'á' with 'a' (right)
sed -i 's/\xc3\xa1/a/g' $LNG'_filtered.po'
#replace 'Á' with 'A' (right)
sed -i 's/\xc3\x81/A/g' $LNG'_filtered.po'
#replace 'à' with 'a' (left)
sed -i 's/\xc3\xa0/a/g' $LNG'_filtered.po'
#replace 'À' with 'A' (left)
sed -i 's/\xc3\x80/A/g' $LNG'_filtered.po'
#replace 'é' with 'e' (right)
sed -i 's/\xc3\xa9/e/g' $LNG'_filtered.po'
#replace 'É' with 'E' (right)
sed -i 's/\xc3\x89/E/g' $LNG'_filtered.po'
#replace 'è' with 'e' (left)
sed -i 's/\xc3\xa8/e/g' $LNG'_filtered.po'
#replace 'È' with 'E' (left)
sed -i 's/\xc3\x88/E/g' $LNG'_filtered.po'
fi
#replace in italian translation
if [ "$LNG" = "it" ]; then
#replace 'é' with 'e' (left)
sed -i 's/\xc3\xa8/e/g' $LNG'_filtered.po'
#replace 'á' with 'a' (left)
sed -i 's/\xc3\xa0/a/g' $LNG'_filtered.po'
#replace 'ó' with 'o' (left)
sed -i 's/\xc3\xb2/o/g' $LNG'_filtered.po'
#replace 'ú' with 'u' (left)
sed -i 's/\xc3\xb9/u/g' $LNG'_filtered.po'
#replace 'é' with 'e'
sed -i 's/\xc3\xa9/e/g' $LNG'_filtered.po'
#replace 'É' with 'E' (left)
sed -i 's/\xc3\x88/E/g' $LNG'_filtered.po'
fi
#replace in dutch translation according to https://nl.wikipedia.org/wiki/Accenttekens_in_de_Nederlandse_spelling
if [ "$LNG" = "nl" ]; then
#replace 'ë' with 'e'
sed -i 's/\xc3\xab/e/g' $LNG'_filtered.po'
#replace 'ï' with 'i'
sed -i 's/\xc3\xaf/i/g' $LNG'_filtered.po'
#replace 'é' with 'e'
sed -i 's/\xc3\xa9/e/g' $LNG'_filtered.po'
#replace 'è' with 'e' (left)
sed -i 's/\xc3\xa8/e/g' $LNG'_filtered.po'
#replace 'ö' with 'o' (left)
sed -i 's/\xc3\xb6/o/g' $LNG'_filtered.po'
#replace 'ê' with 'e' (left)
sed -i 's/\xc3\xaa/e/g' $LNG'_filtered.po'
#replace 'ü' with 'u' (left)
sed -i 's/\xc3\xbc/u/g' $LNG'_filtered.po'
#replace 'ç' with 'c' (left)
sed -i 's/\xc3\xa7/c/g' $LNG'_filtered.po'
#replace 'á' with 'a' (left)
sed -i 's/\xc3\xa1/a/g' $LNG'_filtered.po'
#replace 'à' with 'a' (left)
sed -i 's/\xc3\xa0/a/g' $LNG'_filtered.po'
#replace 'ä' with 'a' (left)
sed -i 's/\xc3\xa4/a/g' $LNG'_filtered.po'
#replace 'û' with 'u' (left)
sed -i 's/\xc3\xbc/u/g' $LNG'_filtered.po'
#replace 'î' with 'i' (left)
sed -i 's/\xc3\xae/i/g' $LNG'_filtered.po'
#replace 'í' with 'i' (left)
sed -i 's/\xc3\xad/i/g' $LNG'_filtered.po'
#replace 'ô' with 'o' (left)
sed -i 's/\xc3\xb4/o/g' $LNG'_filtered.po'
#replace 'ú' with 'u' (left)
sed -i 's/\xc3\xba/u/g' $LNG'_filtered.po'
#replace 'ñ' with 'n' (left)
sed -i 's/\xc3\xb1/n/g' $LNG'_filtered.po'
#replace 'â' with 'a' (left)
sed -i 's/\xc3\xa2/a/g' $LNG'_filtered.po'
#replace 'Å' with 'A' (left)
sed -i 's/\xc3\x85/A/g' $LNG'_filtered.po'
fi
if [ "$LNG" = "sv" ]; then
#repace 'Å' with 'Aa'
sed -i 's/\xc3\x85/Aa/g' $LNG'_filtered.po'
#repace 'å' with 'aa'
sed -i 's/\xc3\xA5/aa/g' $LNG'_filtered.po'
fi
if [ "$LNG" = "da" ]; then
#repace 'Å' with 'Aa'
sed -i 's/\xc3\x85/Aa/g' $LNG'_filtered.po'
#repace 'å' with 'aa'
sed -i 's/\xc3\xA5/aa/g' $LNG'_filtered.po'
fi
if [ "$LNG" = "sl" ]; then
#replace 'ë' with 'e'
sed -i 's/\xc3\xab/e/g' $LNG'_filtered.po'
#replace 'ä' with 'a' (left)
sed -i 's/\xc3\xa4/a/g' $LNG'_filtered.po'
#replace 'é' with 'e'
sed -i 's/\xc3\xa9/e/g' $LNG'_filtered.po'
fi
if [ "$LNG" = "hu" ]; then # See https://www.fileformat.info/info/charset/UTF-8/list.htm
#replace 'Á' with 'A'(acute)
sed -i 's/\xc3\x81/A/g' $LNG'_filtered.po'
#replace 'á' with 'a'
sed -i 's/\xc3\xa1/a/g' $LNG'_filtered.po'
#replace 'É' with 'E' (acute)
sed -i 's/\xc3\x89/E/g' $LNG'_filtered.po'
#replace 'é' with 'e'
sed -i 's/\xc3\xa9/e/g' $LNG'_filtered.po'
#replace 'Í' with 'I' (acute)
sed -i 's/\xc3\x8d/I/g' $LNG'_filtered.po'
#replace 'i̇́' with 'i'
sed -i 's/\xc3\xad/i/g' $LNG'_filtered.po'
#replace 'Ó' with 'O' (acute)
sed -i 's/\xc3\x93/O/g' $LNG'_filtered.po'
#replace 'ó' with 'o'
sed -i 's/\xc3\xb3/o/g' $LNG'_filtered.po'
#replace 'Ö' with 'O' (diaresis)
sed -i 's/\xc3\x96/O/g' $LNG'_filtered.po'
#replace 'ö' with 'o'
sed -i 's/\xc3\xb6/o/g' $LNG'_filtered.po'
#replace 'Ő' with 'O' (double acute)
sed -i 's/\xc5\x90/O/g' $LNG'_filtered.po'
#replace 'ő' with 'o'
sed -i 's/\xc5\x91/o/g' $LNG'_filtered.po'
#replace 'Ú' with 'U' (acute)
sed -i 's/\xc3\x9a/U/g' $LNG'_filtered.po'
#replace 'ú' with 'u'
sed -i 's/\xc3\xba/u/g' $LNG'_filtered.po'
#replace 'Ü' with 'U' (diaersis)
sed -i 's/\xc3\x9c/U/g' $LNG'_filtered.po'
#replace 'ü' with 'u'
sed -i 's/\xc3\xbc/u/g' $LNG'_filtered.po'
#replace 'Ű' with 'U' (double acute)
sed -i 's/\xc5\xb0/U/g' $LNG'_filtered.po'
#replace 'ű' with 'u'
sed -i 's/\xc5\xb1/u/g' $LNG'_filtered.po'
fi
if [ "$LNG" = "lb" ]; then
#replace 'ë' with 'e'
sed -i 's/\xc3\xab/e/g' $LNG'_filtered.po'
#replace 'ä' with 'a'
sed -i 's/\xc3\xa4/a/g' $LNG'_filtered.po'
#replace 'é' with 'e'
sed -i 's/\xc3\xa9/e/g' $LNG'_filtered.po'
fi
if [ "$LNG" = "hr" ]; then
#replace 'ë' with 'e'
sed -i 's/\xc3\xab/e/g' $LNG'_filtered.po'
#replace 'ä' with 'a'
sed -i 's/\xc3\xa4/a/g' $LNG'_filtered.po'
#replace 'é' with 'e'
sed -i 's/\xc3\xa9/e/g' $LNG'_filtered.po'
fi
if [ "$LNG" = "lt" ]; then
#replace 'ë' with 'e'
sed -i 's/\xc3\xab/e/g' $LNG'_filtered.po'
#replace 'ä' with 'a'
sed -i 's/\xc3\xa4/a/g' $LNG'_filtered.po'
#replace 'é' with 'e'
sed -i 's/\xc3\xa9/e/g' $LNG'_filtered.po'
fi
#replace in polish translation
#if [ "$LNG" = "pl" ]; then
#fi
#replace in slovak translation
if [ "$LNG" = "sk" ]; then
#replace 'Á' with 'A'
sed -i 's/\xc3\x81/A/g' $LNG'_filtered.po'
#replace 'á' with 'a'
sed -i 's/\xc3\xa1/a/g' $LNG'_filtered.po'
#replace 'ä' with 'a'
sed -i 's/\xc3\xa4/a/g' $LNG'_filtered.po'
#replace 'Č' with 'C'
sed -i 's/\xc4\x8c/C/g' $LNG'_filtered.po'
#replace 'č' with 'c'
sed -i 's/\xc4\x8d/c/g' $LNG'_filtered.po'
#replace 'Ď' with 'D'
sed -i 's/\xc4\x8e/D/g' $LNG'_filtered.po'
#replace 'ď' with 'd'
sed -i 's/\xc4\x8f/d/g' $LNG'_filtered.po'
#replace 'É' with 'E'
sed -i 's/\xc3\x89/E/g' $LNG'_filtered.po'
#replace 'é' with 'e'
sed -i 's/\xc3\xa9/e/g' $LNG'_filtered.po'
#replace 'Í' with 'I'
sed -i 's/\xc3\x8d/I/g' $LNG'_filtered.po'
#replace 'í' with 'i'
sed -i 's/\xc3\xad/i/g' $LNG'_filtered.po'
#replace 'ľ' with 'l'
sed -i 's/\xc4\xbe/l/g' $LNG'_filtered.po'
#replace 'Ľ' with 'L'
sed -i 's/\xc4\xbd/L/g' $LNG'_filtered.po'
#replace 'Ň' with 'N'
sed -i 's/\xc5\x87/N/g' $LNG'_filtered.po'
#replace 'ň' with 'n'
sed -i 's/\xc5\x88/n/g' $LNG'_filtered.po'
#replace 'Ó' with 'O'
sed -i 's/\xc3\x93/O/g' $LNG'_filtered.po'
#replace 'ó' with 'o'
sed -i 's/\xc3\xb3/o/g' $LNG'_filtered.po'
#replace 'ô' with 'o'
sed -i 's/\xc3\xb4/o/g' $LNG'_filtered.po'
#replace 'Ô' with 'O'
sed -i 's/\xc3\x94/O/g' $LNG'_filtered.po'
#replace 'ŕ' with 'r'
sed -i 's/\xc5\x95/r/g' $LNG'_filtered.po'
#replace 'Ŕ' with 'R'
sed -i 's/\xc5\x94/R/g' $LNG'_filtered.po'
#replace 'Š' with 'S'
sed -i 's/\xc5\xa0/S/g' $LNG'_filtered.po'
#replace 'š' with 's'
sed -i 's/\xc5\xa1/s/g' $LNG'_filtered.po'
#replace 'Ť' with 'T'
sed -i 's/\xc5\xa4/T/g' $LNG'_filtered.po'
#replace 'ť' with 't'
sed -i 's/\xc5\xa5/t/g' $LNG'_filtered.po'
#replace 'Ú' with 'U'
sed -i 's/\xc3\x9a/U/g' $LNG'_filtered.po'
#replace 'ú' with 'u'
sed -i 's/\xc3\xba/u/g' $LNG'_filtered.po'
#replace 'Ý' with 'Y'
sed -i 's/\xc3\x9d/Y/g' $LNG'_filtered.po'
#replace 'ý' with 'y'
sed -i 's/\xc3\xbd/y/g' $LNG'_filtered.po'
#replace 'Ž' with 'Z'
sed -i 's/\xc5\xbd/Z/g' $LNG'_filtered.po'
#replace 'ž' with 'z'
sed -i 's/\xc5\xbe/z/g' $LNG'_filtered.po'
fi
#replace UTF-8 'μ' to HD44780 A00 'μ'
#replace 'μ' with 'A00 ROM μ'
sed -i 's/\xce\xbc/\\xe4/g' $LNG'_filtered.po'
#replace non-break space with space
sed -i 's/\xc2\xa0/ /g' $LNG'_filtered.po'
#check for nonasci characters except HD44780 ROM A00 'äöüß'
if grep --color='auto' -P -n '[^\x00-\x7F]' $LNG'_filtered.po' >nonascii.txt; then
exit
fi
#join lines with multi-line string constants
cat $LNG'_filtered.po' | sed ':a;N;$!ba;s/\x22\n\x22//g' > $LNG'_new.po'
#Get counter from po files
CNTTXT=$(grep '^# MSG' -c $LNGISO.po)
num=1
echo " selected language=$(tput setaf 2)$LNGISO$(tput sgr 0)" >&2
#generate new dictionary
cat ../../lang_en.txt | sed 's/\\/\\\\/g' | while read -r s; do
/bin/echo -e "$s"
#echo "s = $s ." >&2
if [ "${s:0:1}" = "\"" ]; then
# /bin/echo -e "$s"
s=$(/bin/echo -e "$s")
s2=$(grep -F -A1 -B0 "msgid $s" "$LNG"_new.po | tail -n1 | sed 's/^msgstr //')
if [ -z "$s2" ]; then
echo -ne " processing $num of $CNTTXT\033[0K\r" >&2
echo '"\x00"'
num=$((num+1))
else
echo -ne " processing $num of $CNTTXT\033[0K\r" >&2
echo "$s2"
num=$((num+1))
fi
# echo
fi
done > lang_en_$LNG.txt
echo >&2
echo "$(tput setaf 2)Finished with $LNGISO$(tput sgr 0)" >&2
#replace two double quotes to "\x00"
sed -i 's/""/"\\x00"/g' lang_en_$LNG.txt
#remove CR
sed -i "s/\r//g" lang_en_$LNG.txt
#check new lang
python3 ../../lang-check.py $LNG --warn-empty
python3 ../../lang-check.py $LNG --information >$LNG-output.txt
echo >&2
echo "$(tput setaf 2)lang-import.sh finished$(tput sgr 0)">&2