diff options
Diffstat (limited to 'sc/workben/celltrans')
-rw-r--r-- | sc/workben/celltrans/keywords_utf16.txt | bin | 0 -> 1830 bytes | |||
-rwxr-xr-x | sc/workben/celltrans/parse.py | 209 |
2 files changed, 209 insertions, 0 deletions
diff --git a/sc/workben/celltrans/keywords_utf16.txt b/sc/workben/celltrans/keywords_utf16.txt Binary files differnew file mode 100644 index 000000000000..5b00a5ffb7d2 --- /dev/null +++ b/sc/workben/celltrans/keywords_utf16.txt diff --git a/sc/workben/celltrans/parse.py b/sc/workben/celltrans/parse.py new file mode 100755 index 000000000000..ea1bf3ab6828 --- /dev/null +++ b/sc/workben/celltrans/parse.py @@ -0,0 +1,209 @@ +#!/usr/bin/env python +#*********************************************************************** +# +# DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. +# +# Copyright 2000, 2010 Oracle and/or its affiliates. +# +# OpenOffice.org - a multi-platform office productivity suite +# +# This file is part of OpenOffice.org. +# +# OpenOffice.org is free software: you can redistribute it and/or modify +# it under the terms of the GNU Lesser General Public License version 3 +# only, as published by the Free Software Foundation. +# +# OpenOffice.org is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU Lesser General Public License version 3 for more details +# (a copy is included in the LICENSE file that accompanied this code). +# +# You should have received a copy of the GNU Lesser General Public License +# version 3 along with OpenOffice.org. If not, see +# <http://www.openoffice.org/license.html> +# for a copy of the LGPLv3 License. 
#
#***********************************************************************

"""Generate C++ keyword translation tables from a UTF-16 keyword list.

The input is read as little-endian UTF-16 code units.  A line starting
with ``$`` names a locale, a line starting with ``@`` names a function,
and any other line holds a comma separated pair: the localized keyword
followed by its English name.  The generated C++ source is written to
the output file.

Usage: parse.py [input file [output file]]
"""

import sys

localeNames = {'fr': 'French', 'hu': 'Hungarian', 'de': 'German'}


def getLocaleName (code):
    """Return the display name for a locale code.

    Codes missing from ``localeNames`` yield "(unknown locale)".
    """
    return localeNames.get(code, "(unknown locale)")


def getAscii (ords):
    """Return the string built from a sequence of character codes."""
    return ''.join(chr(c) for c in ords)


class LocaleData(object):
    """Keyword mappings collected for a single locale.

    ``funcList`` maps a function name to a list of
    ``[localeName, engName]`` pairs, each name being a list of UTF-16
    code units.
    """

    def __init__ (self, locale):
        self.locale = locale
        self.funcList = {}

    def addKeywordMap (self, funcName, localeName, engName):
        """Record one localized/English keyword pair for funcName."""
        self.funcList.setdefault(funcName, []).append([localeName, engName])

    def getLocaleFuncVarName (self, func, pair):
        """Return the C++ variable name used for one keyword pair.

        The name is built from the lower-cased function name, the
        lower-cased English keyword (pair[1]) and the locale code.
        """
        return func.lower() + "_" + getAscii(pair[1]).lower() + "_" + self.locale

    def dumpCode (self):
        """Return the generated C++ source for this locale as a string."""
        # NOTE(review): the whitespace inside the string literals below is
        # reproduced exactly as it appears in the reviewed text, which had
        # its whitespace collapsed - confirm the intended indent width.
        suffix = self.locale.capitalize()
        rule = "// " + "-"*75 + "\n"

        # locale output
        out = [
            rule,
            "// %s language locale (automatically generated)\n" % getLocaleName(self.locale),
            rule,
            "static const Locale a" + suffix + "(OUString::createFromAscii(\"",
            self.locale,
            "\"), OUString(), OUString());\n\n",
        ]

        # pre instantiations of localized function names.
        # sorted() works on both Python 2 and 3; keys().sort() does not.
        funcs = sorted(self.funcList)
        out.append("// pre instantiations of localized function names\n")
        for func in funcs:
            for item in self.funcList[func]:
                # Dump the UTF-16 code units, then null-terminate the string.
                units = ["0x%.4X" % uval for uval in item[0]]
                units.append("0x0000")
                out.append("static const sal_Unicode "
                           + self.getLocaleFuncVarName(func, item) + "[] = {\n")
                out.append(" " + ", ".join(units) + "};\n")

        # map item instantiations
        out.append("\n")
        out.append("static const TransItem p" + suffix + "[] = {\n")
        for func in funcs:
            for item in self.funcList[func]:
                out.append(" " + "{%s, \"%s\", %s},\n" % (
                    self.getLocaleFuncVarName(func, item),
                    getAscii(item[1]),
                    "oc" + func.capitalize()))

        out.append(" {NULL, NULL, ocNone}\n")
        out.append("};\n\n")

        # addToMap call
        out.append("addToMap(%s, %s);\n" % ("p" + suffix, "a" + suffix))

        return "".join(out)


class Parser(object):
    """Read the keyword list and write the generated C++ source.

    ``args`` follows the ``sys.argv`` layout: args[1], when present,
    overrides the input file and args[2] the output file.
    """

    def __init__ (self, args):
        # default input & output files.
        self.infile = "./keywords_utf16.txt"
        self.outfile = "../../source/core/tool/cellkeywords.inl"

        if len(args) >= 2:
            self.infile = args[1]
        if len(args) >= 3:
            self.outfile = args[2]

    def getDByte (self):
        """Return the next 16-bit code unit and advance past it.

        ``self.bytes`` must be a bytearray (as set up by parse()), so that
        indexing yields integers on both Python 2 and Python 3.
        """
        # Assume little endian: low byte first, high byte second.
        low = self.bytes[self.i]
        high = self.bytes[self.i+1]
        self.i += 2
        return high*256 + low

    def parseLine (self):
        """Return the code units up to the next linefeed, consuming it."""
        buf = []
        while self.i < self.size:
            dbyte = self.getDByte()
            if dbyte == 0x000A:
                break
            buf.append(dbyte)
        return buf

    def dumpBuf (self, buf, linefeed=True):
        """Write buf to stdout as characters, optionally ending the line."""
        for item in buf:
            sys.stdout.write(chr(item))
        if linefeed:
            sys.stdout.write('\n')

    def parse (self):
        """Parse the input file and write the generated code to the output."""
        # The input is raw UTF-16 decoded by hand, so it must be read in
        # binary mode; text mode may translate or reject bytes.
        with open(self.infile, 'rb') as stream:
            self.bytes = bytearray(stream.read())

        self.size = len(self.bytes)
        self.i = 0

        localeList = [] # stores an array of locale data objects.
        funcName = None
        word = []
        wordPair = []

        while self.i < self.size:
            dbyte = self.getDByte()
            if dbyte == 0xFEFF and self.i == 2:
                # unicode signature - ignore it.
                pass
            elif dbyte == 0x0024:
                # $ - locale name
                localeList.append(LocaleData(getAscii(self.parseLine())))
            elif dbyte == 0x0040:
                # @ - function name
                funcName = getAscii(self.parseLine())
            elif dbyte == 0x002C:
                # , - comma separator
                if word:
                    wordPair.append(word)
                    word = []
            elif dbyte == 0x000A:
                # linefeed
                if word:
                    wordPair.append(word)
                    word = []
                if len(wordPair) >= 2:
                    localeList[-1].addKeywordMap(funcName, wordPair[0], wordPair[1])
                wordPair = []
            elif dbyte in (0x0009, 0x0020):
                # whitespace - ignore it.
                pass
            else:
                word.append(dbyte)

        # The input may end without a final linefeed; flush the pending
        # pair so that the last keyword line is not silently lost.
        if word:
            wordPair.append(word)
        if len(wordPair) >= 2:
            localeList[-1].addKeywordMap(funcName, wordPair[0], wordPair[1])

        chars = "// This file has been automatically generated. Do not hand-edit this!\n"
        chars += "".join("\n" + obj.dumpCode() for obj in localeList)

        # Write to output file.
        with open(self.outfile, 'w') as stream:
            stream.write(chars)


if __name__=='__main__':
    parser = Parser(sys.argv)
    parser.parse()