63 lines
1.9 KiB
C++
63 lines
1.9 KiB
C++
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
|
|
/*
|
|
* This file is part of the LibreOffice project.
|
|
*
|
|
* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
*/
|
|
|
|
#include <ToxWhitespaceStripper.hxx>
|
|
|
|
#include <o3tl/safeint.hxx>
|
|
#include <rtl/ustrbuf.hxx>
|
|
#include <sal/log.hxx>
|
|
|
|
|
|
namespace sw {
|
|
|
|
// Builds the whitespace-normalised copy of inputString (stored in mStripped)
// and, alongside it, the table mNewPositions that maps every index of
// inputString to an index in the normalised text.
//
// Normalisation rules, as implemented below:
//  - ' ', '\n' and '\t' are the only characters treated as whitespace;
//  - a run of whitespace is collapsed into a single ' ';
//  - a single trailing ' ' left after collapsing is removed.
//
// mNewPositions receives one entry per input character plus one final entry
// holding the length of the normalised text.
ToxWhitespaceStripper::ToxWhitespaceStripper(std::u16string_view inputString)
{
    OUStringBuffer aCollapsed;

    // True while the most recently consumed input character was whitespace.
    bool bInBlankRun = false;
    for (const sal_Unicode ch : inputString)
    {
        const bool bIsBlank = (ch == ' ' || ch == '\n' || ch == '\t');

        if (!bIsBlank)
            aCollapsed.append(ch);
        else if (!bInBlankRun)
            aCollapsed.append(' '); // first blank of a run: emit one space
        // else: further blanks of the same run emit nothing

        bInBlankRun = bIsBlank;

        // Every input character maps to the last character currently in the
        // buffer: either the one it just produced or the space it merged into.
        mNewPositions.push_back(aCollapsed.getLength() - 1);
    }

    // A blank run at the very end left exactly one space behind; drop it.
    // The entries recorded for that run then equal the final length.
    if (bInBlankRun)
    {
        aCollapsed.truncate(aCollapsed.getLength() - 1);
    }

    // Extra entry for the position one past the last input character.
    // Must be recorded before the buffer is cleared below.
    mNewPositions.push_back(aCollapsed.getLength());
    mStripped = aCollapsed.makeStringAndClear();
}
|
|
|
|
|
|
// Translates a position in the original (unstripped) string into the
// corresponding position in the stripped string by looking it up in
// mNewPositions.
//
// pos must be non-negative (asserted). If pos lies beyond the recorded
// positions, a warning is logged and the last recorded position is returned.
sal_Int32
ToxWhitespaceStripper::GetPositionInStrippedString(sal_Int32 pos) const
{
    assert(0 <= pos);

    const auto nIndex = o3tl::make_unsigned(pos);
    if (nIndex < mNewPositions.size())
    {
        return mNewPositions.at(nIndex);
    }

    // Out of range: fall back to the last recorded position.
    // TODO probably this should assert, not just warn?
    SAL_WARN("sw.core", "Requested position of TOX entry text which does not exist. "
                        "Maybe the formatting hint is corrupt?");
    return mNewPositions.back();
}
|
|
|
|
|
|
}
|