diff options
Diffstat (limited to 'oox/source/token/namespaces.py')
-rw-r--r-- | oox/source/token/namespaces.py | 85 |
1 files changed, 85 insertions, 0 deletions
diff --git a/oox/source/token/namespaces.py b/oox/source/token/namespaces.py new file mode 100644 index 000000000..1244e88e8 --- /dev/null +++ b/oox/source/token/namespaces.py @@ -0,0 +1,85 @@ +# This file is part of the LibreOffice project. +# +# This Source Code Form is subject to the terms of the Mozilla Public +# License, v. 2.0. If a copy of the MPL was not distributed with this +# file, You can obtain one at http://mozilla.org/MPL/2.0/. +# +# This file incorporates work covered by the following license notice: +# +# Licensed to the Apache Software Foundation (ASF) under one or more +# contributor license agreements. See the NOTICE file distributed +# with this work for additional information regarding copyright +# ownership. The ASF licenses this file to you under the Apache +# License, Version 2.0 (the "License"); you may not use this file +# except in compliance with the License. You may obtain a copy of +# the License at http://www.apache.org/licenses/LICENSE-2.0 . +# + +import sys, re + +infile_name = sys.argv[1] +id_out_name = sys.argv[2] +name_out_name = sys.argv[3] +txt_out_name = sys.argv[4] +instrict_name = sys.argv[5] +strict_out_name = sys.argv[6] + +# parse input file + +namespaces = {} + +with open(infile_name) as infile: + for line in infile: + line = line.strip() + # trim comments + line = line.split('#')[0] + # skip empty lines + if line: + # check for valid characters + m = re.match(r'([a-zA-Z][a-zA-Z0-9]*)\s+([a-zA-Z0-9-.:\/]+)\s*$', line) + if not m: + sys.exit('Invalid character in input data: ' + line) + namespaces[m.group(1)] = m.group(2) + +# OOXML strict namespaces + +namespaces_strict = {} +with open(instrict_name) as infile_strict: + for line in infile_strict: + line = line.strip() + # trim comments + line = line.split('#')[0] + # skip empty lines + if line: + # check for valid characters + m = re.match(r'([a-zA-Z][a-zA-Z0-9]*)\s+([a-zA-Z0-9-.:\/]+)\s*$', line) + if not m: + sys.exit("Error: invalid character in input data: " + line) + namespaces_strict[m.group(1)] = m.group(2) + +# generate output files + +idfile = open(id_out_name, 'w') +namefile = open(name_out_name, 'w') +txtfile = open(txt_out_name, 'w') +namefile_strict = open(strict_out_name, 'w') + +# number of bits to shift the namespace identifier +shift = 16 + +idfile.write("const size_t NMSP_SHIFT = {};\n".format(shift)) + +i = 1; +for token in sorted(namespaces.keys()): + idfile.write("const sal_Int32 NMSP_{} = {} << NMSP_SHIFT;\n".format(token, i)) + cur_id = i << shift + namefile.write("{{ {}, \"{}\" }},\n".format(cur_id, namespaces[token])) + namefile_strict.write("{{ {}, \"{}\" }},\n".format(cur_id, namespaces_strict[token])) + txtfile.write("{} {} {}\n".format(cur_id, token, namespaces[token])) + txtfile.write("{} {} {}\n".format(cur_id, token, namespaces_strict[token])) + i += 1 + +idfile.close() +namefile.close() +namefile_strict.close() +txtfile.close() |