diff options
author | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-15 05:48:59 +0000 |
---|---|---|
committer | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-15 05:48:59 +0000 |
commit | c484829272cd13a738e35412498e12f2c9a194ac (patch) | |
tree | a1f5ec09629ee895bd3963fa8820b45f2f4c574b /src/parser/sax_token_parser.cpp | |
parent | Initial commit. (diff) | |
download | liborcus-upstream.tar.xz liborcus-upstream.zip |
Adding upstream version 0.19.2.upstream/0.19.2upstream
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'src/parser/sax_token_parser.cpp')
-rw-r--r-- | src/parser/sax_token_parser.cpp | 110 |
1 files changed, 110 insertions, 0 deletions
diff --git a/src/parser/sax_token_parser.cpp b/src/parser/sax_token_parser.cpp new file mode 100644 index 0000000..fdf80c6 --- /dev/null +++ b/src/parser/sax_token_parser.cpp @@ -0,0 +1,110 @@ +/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */ +/* + * This Source Code Form is subject to the terms of the Mozilla Public + * License, v. 2.0. If a copy of the MPL was not distributed with this + * file, You can obtain one at http://mozilla.org/MPL/2.0/. + */ + +#include "orcus/sax_token_parser.hpp" +#include "orcus/tokens.hpp" + +#include <mdds/sorted_string_map.hpp> +#include <cctype> + +namespace orcus { + +namespace { + +enum class decl_attr_type { unknown, version, encoding, standalone }; + +namespace decl_attr { + +using map_type = mdds::sorted_string_map<decl_attr_type, mdds::string_view_map_entry>; + +// Keys must be sorted. +constexpr map_type::entry entries[] = { + { "encoding", decl_attr_type::encoding }, + { "standalone", decl_attr_type::standalone }, + { "version", decl_attr_type::version }, +}; + +const map_type& get() +{ + static map_type mt(entries, std::size(entries), decl_attr_type::unknown); + return mt; +} + +} // namespace decl_attr + +} + +sax_token_handler_wrapper_base::sax_token_handler_wrapper_base(const tokens& _tokens) : + m_tokens(_tokens) {} + +xml_token_t sax_token_handler_wrapper_base::tokenize(std::string_view name) const +{ + xml_token_t token = XML_UNKNOWN_TOKEN; + if (!name.empty()) + token = m_tokens.get_token(name); + return token; +} + +void sax_token_handler_wrapper_base::set_element(const sax_ns_parser_element& elem) +{ + m_elem.ns = elem.ns; + m_elem.name = tokenize(elem.name); + m_elem.raw_name = elem.name; +} + +void sax_token_handler_wrapper_base::attribute(std::string_view name, std::string_view val) +{ + decl_attr_type dat = decl_attr::get().find(name); + + switch (dat) + { + case decl_attr_type::version: + { + const char* p = val.data(); + const char* p_end = p + val.size(); + + long v; + const char* endptr = parse_integer(p, p_end, v); + + if (!endptr || endptr >= p_end || *endptr != '.') + break; + + m_declaration.version_major = v; + p = endptr + 1; + + endptr = parse_integer(p, p_end, v); + + if (!endptr || endptr > p_end) + break; + + m_declaration.version_minor = v; + break; + } + case decl_attr_type::encoding: + { + m_declaration.encoding = to_character_set(val); + break; + } + case decl_attr_type::standalone: + m_declaration.standalone = (val == "yes") ? true : false; + break; + default: + ; + } +} + +void sax_token_handler_wrapper_base::attribute(const sax_ns_parser_attribute& attr) +{ + m_elem.attrs.push_back( + xml_token_attr_t( + attr.ns, tokenize(attr.name), attr.name, + attr.value, attr.transient)); +} + +} + +/* vim:set shiftwidth=4 softtabstop=4 expandtab: */ |