/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
/*
 * This file is part of the LibreOffice project.
 *
 * This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
 */

#include <ToxWhitespaceStripper.hxx>

#include <o3tl/safeint.hxx>
#include <rtl/ustrbuf.hxx>
#include <sal/log.hxx>

namespace sw {

/**
 * Build the whitespace-normalised form of @p inputString.
 *
 * Every run of ' ', '\n' and '\t' is collapsed into a single ' ', and a
 * whitespace run at the very end of the input is dropped. The result is
 * stored in mStripped.
 *
 * While scanning, mNewPositions receives one entry per input character:
 * the index of the last character present in the output buffer right after
 * that input character has been handled. One extra entry, equal to the
 * length of the stripped string, is appended for the position just past
 * the end of the input.
 *
 * @param inputString the text to normalise
 */
ToxWhitespaceStripper::ToxWhitespaceStripper(std::u16string_view inputString)
{
    OUStringBuffer aCollapsed;

    // true while the most recently handled input character was whitespace
    bool bInWhitespaceRun = false;

    for (const sal_Unicode cChar : inputString)
    {
        const bool bIsWhitespace = (cChar == ' ' || cChar == '\n' || cChar == '\t');

        if (!bIsWhitespace)
        {
            aCollapsed.append(cChar);
        }
        else if (!bInWhitespaceRun)
        {
            // first whitespace of a run: emit exactly one space for the whole run
            aCollapsed.append(' ');
        }
        bInWhitespaceRun = bIsWhitespace;

        // all characters of one whitespace run share the index of its single space
        mNewPositions.push_back(aCollapsed.getLength() - 1);
    }

    // a trailing whitespace run left one space at the end of the buffer; drop it
    if (bInWhitespaceRun)
    {
        aCollapsed.truncate(aCollapsed.getLength() - 1);
    }

    // entry for the position directly behind the last input character
    mNewPositions.push_back(aCollapsed.getLength());

    mStripped = aCollapsed.makeStringAndClear();
}

/**
 * Translate a position in the original string into the stripped string.
 *
 * @param pos position in the string that was passed to the constructor;
 *            asserted to be non-negative
 * @return the recorded position for @p pos; if @p pos lies beyond the
 *         recorded positions, a warning is logged and the last recorded
 *         position (the length of the stripped string) is returned
 */
sal_Int32 ToxWhitespaceStripper::GetPositionInStrippedString(sal_Int32 pos) const
{
    assert(0 <= pos);

    const bool bKnownPosition = o3tl::make_unsigned(pos) < mNewPositions.size();
    if (bKnownPosition)
    {
        return mNewPositions.at(pos);
    }

    // TODO probably this should assert, not just warn?
    SAL_WARN("sw.core", "Requested position of TOX entry text which does not exist. "
                        "Maybe the formatting hint is corrupt?");
    return mNewPositions.back();
}

}