summaryrefslogtreecommitdiffstats
path: root/kexi/kexiutils/generate_transliteration_table.sh
blob: 05470772b3ac0cc84ac7d7cbdb7c206eea014eaa (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
#!/bin/bash
#
#   Copyright (C) 2006-2007 Jaroslaw Staniek <js@iidea.pl>
#
#   Based on the original script by Michal Svec <rebel@atrey.karlin.mff.cuni.cz>
#
#   This program is free software; you can redistribute it and/or
#   modify it under the terms of the GNU General Public
#   License as published by the Free Software Foundation; either
#   version 2 of the License, or (at your option) any later version.
#
#   This program is distributed in the hope that it will be useful,
#   but WITHOUT ANY WARRANTY; without even the implied warranty of
#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
#    General Public License for more details.
#
#   You should have received a copy of the GNU General Public License
#   along with this program; see the file COPYING.  If not, write to
#   the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
#   Boston, MA 02110-1301, USA.

#
# Generates a transliteration_table.{h|cpp} files using recode's "flat" character set
#

out_cpp="transliteration_table.cpp"
out_h="transliteration_table.h"
max=65534

decl="const char *const transliteration_table[TRANSLITERATION_TABLE_SIZE + 1]"

header=\
"/* Transliteration table of `expr $max + 1` unicode characters
   Do not edit this file, it is generated
   by $0 script. */

"
echo "$header
#define TRANSLITERATION_TABLE_SIZE `expr $max + 1`
extern $decl;
" > $out_h

echo "$header
#include \"$out_h\"
$decl = {
" > $out_cpp

for i in `seq 0 $max` ; do
	f=`printf "%04x" $i`
	if [ "$i" -lt 16 -o "$i" -eq 92 ] ; then
		printf "$i\n/*$f*/\n_\n" $i
	elif [ "$i" -lt 128 ] ; then
		ch=`printf "%03o" $i`
		printf "$i\n/*$f*/\n\\"$ch"\n"
	else
		{ /usr/bin/printf "${i}\n/*${f}*/\n\u${f}\n" 2>&- || echo "_"; }
	fi
done | \
while read i && read f && read ch; do
	if ! expr "$i" % 8 > /dev/null ; then
		expr "$i" % 320 > /dev/null || echo -n ..`expr "$i" \* 100 / $max `% >&2 #progress
		echo
	else
		f= # <-- comment to add /*numbers*/ everywhere
	fi
	r=`echo -n "$ch" | recode -f utf-8..flat | \
		sed -r -e 's/[^[:alnum:]]//g;s/_+/_/g'`
	if [ -z "$r" -o "$r" == "_" ] ; then
		echo -n "${f}0/*${ch}*/,"
	else
		echo -n "${f}\"$r\"/*${ch}*/,"
	fi
done >> $out_cpp

echo "0};" >> $out_cpp;