# SUCH DAMAGE.

import re
import string
import sys

import generate
import UnicodeData
import util

# Three arguments are required: the UnicodeData file, the composition
# exclusions file and the output directory.
if len(sys.argv) != 4:
    # A single parenthesised argument prints the same text under the
    # Python 2 print statement and the Python 3 print function.
    print("usage: %s UnicodeData.txt"
          " CompositionExclusions-3.2.0.txt out-dir" % sys.argv[0])
    sys.exit(1)

ud = UnicodeData.read(sys.argv[1])


def sortedKeys(d):
    """Return a sorted list of the keys of a dict"""
    # sorted() always builds a new list, so this no longer depends on
    # d.keys() returning a list with an in-place .sort() method.
    return sorted(d.keys())


# Keep only the entries whose field 4 is non-empty.  Each kept entry maps
# its key to [field 4 with every "<letters>" tag removed, field 0].
# NOTE(review): field 4 is presumably the decomposition mapping and field 0
# the character name -- confirm against UnicodeData.read().
trans = {}
for k, v in ud.items():
    if v[4]:
        trans[k] = [re.sub('<[a-zA-Z]+>', '', v[4]), v[0]]

# Largest number of whitespace-separated items in any cleaned field-4
# string; stays 0 when trans is empty.
maxLength = 0
for v in trans.values():
    maxLength = max(maxLength, len(v[0].split()))

normalize_h = generate.Header('%s/normalize_table.h' % sys.argv[3])
# LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY # OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF # SUCH DAMAGE. import re import string import sys import generate import UnicodeData if len(sys.argv) != 3: print "usage: %s UnicodeData.txt out-dir" % sys.argv[0] sys.exit(1) ud = UnicodeData.read(sys.argv[1]) trans = {} for k,v in ud.items(): if int(v[2]) != 0 : trans[k] = [int(v[2]), v[1]] # trans = [(x[0], int(x[3]), x[1]) for x in UnicodeData.read() if int(x[3]) != 0] combining_h = generate.Header('%s/combining_table.h' % sys.argv[2]) combining_c = generate.Implementation('%s/combining_table.c' % sys.argv[2]) combining_h.file.write( ''' #include <krb5-types.h>
# LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY # OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF # SUCH DAMAGE. import re import string import sys import generate import UnicodeData if len(sys.argv) != 3: print "usage: %s UnicodeData.txt out-dir" % sys.argv[0] sys.exit(1) ud = UnicodeData.read(sys.argv[1]) trans = {} for k, v in ud.items(): if int(v[2]) != 0: trans[k] = [int(v[2]), v[1]] # trans = [(x[0], int(x[3]), x[1]) for x in UnicodeData.read() if int(x[3]) != 0] combining_h = generate.Header('%s/combining_table.h' % sys.argv[2]) combining_c = generate.Implementation('%s/combining_table.c' % sys.argv[2]) combining_h.file.write(''' #include <krb5-types.h> struct translation {
# SUCH DAMAGE.

import re
import string
import sys

import generate
import UnicodeData
import util

# Three arguments are required: the UnicodeData file, the composition
# exclusions file and the output directory.
if len(sys.argv) != 4:
    # A single parenthesised argument prints the same text under the
    # Python 2 print statement and the Python 3 print function.
    print("usage: %s UnicodeData.txt"
          " CompositionExclusions-3.2.0.txt out-dir" % sys.argv[0])
    sys.exit(1)

ud = UnicodeData.read(sys.argv[1])


def sortedKeys(d):
    """Return a sorted list of the keys of a dict"""
    # sorted() always builds a new list, so this no longer depends on
    # d.keys() returning a list with an in-place .sort() method.
    return sorted(d.keys())


# Keep only the entries whose field 4 is non-empty.  Each kept entry maps
# its key to [field 4 with every "<letters>" tag removed, field 0].
# NOTE(review): field 4 is presumably the decomposition mapping and field 0
# the character name -- confirm against UnicodeData.read().
trans = {}
for k, v in ud.items():
    if v[4]:
        trans[k] = [re.sub('<[a-zA-Z]+>', '', v[4]), v[0]]

# Largest number of whitespace-separated items in any cleaned field-4
# string; stays 0 when trans is empty.
maxLength = 0
for v in trans.values():
    maxLength = max(maxLength, len(v[0].split()))
#!/usr/bin/python # -*- coding: utf-8 -*- import sys import UnicodeData import struct if len(sys.argv) != 2: print >> sys.stderr, "Usage: %s <unicode_data_dir>" % sys.argv[0] print >> sys.stderr, "Takes UnicodeData.txt, PropList.txt ... and turns into optimized table files" sys.exit(99) unicode_data_dir = sys.argv[1] UnicodeData.read(unicode_data_dir) last_codepoint = max(UnicodeData.data.keys()) print "Last codepoint: %d" % last_codepoint ## Generate codepoint->script mapping script_name_to_code_mapping = { "Adlam": 1, "Ahom": 2, "Anatolian_Hieroglyphs": 3, "Arabic": 4, "Armenian": 5, "Avestan": 6, "Balinese": 7, "Bamum": 8, "Bassa_Vah": 9, "Batak": 10, "Bengali": 11,