Adding upstream version 4:24.2.0.upstream/4%24.2.0

Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
author: Daniel Baumann <daniel.baumann@progress-linux.org> 2024-04-15 05:54:39 +0000
committer: Daniel Baumann <daniel.baumann@progress-linux.org> 2024-04-15 05:54:39 +0000
commit: 267c6f2ac71f92999e969232431ba04678e7437e (patch)
tree: 358c9467650e1d0a1d7227a21dac2e3d08b622b2 /l10ntools/source/lngmerge.cxx
parent: Initial commit. (diff)
download: libreoffice-267c6f2ac71f92999e969232431ba04678e7437e.tar.xz
libreoffice-267c6f2ac71f92999e969232431ba04678e7437e.zip
1 files changed, 281 insertions, 0 deletions
diff --git a/l10ntools/source/lngmerge.cxx b/l10ntools/source/lngmerge.cxx
new file mode 100644
index 0000000000..4eaa94940c
--- /dev/null
+++ b/l10ntools/source/lngmerge.cxx
@@ -0,0 +1,281 @@
+/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
+/*
+ * This file is part of the LibreOffice project.
+ *
+ * This Source Code Form is subject to the terms of the Mozilla Public
+ * License, v. 2.0. If a copy of the MPL was not distributed with this
+ * file, You can obtain one at http://mozilla.org/MPL/2.0/.
+ *
+ * This file incorporates work covered by the following license notice:
+ *
+ *   Licensed to the Apache Software Foundation (ASF) under one or more
+ *   contributor license agreements. See the NOTICE file distributed
+ *   with this work for additional information regarding copyright
+ *   ownership. The ASF licenses this file to you under the Apache
+ *   License, Version 2.0 (the "License"); you may not use this file
+ *   except in compliance with the License. You may obtain a copy of
+ *   the License at http://www.apache.org/licenses/LICENSE-2.0 .
+ */
+
+#include <sal/config.h>
+
+#include <o3tl/string_view.hxx>
+
+#include <cstddef>
+#include <iostream>
+#include <memory>
+#include <string>
+
+#include <common.hxx>
+#include <po.hxx>
+#include <lngmerge.hxx>
+#include <utility>
+
+namespace {
+
+// Checks whether an already trimmed line has the form "[name]".
+// On a match the trimmed text between the brackets is stored in sGroup_out
+// and true is returned; otherwise sGroup_out is left alone and the result is
+// false.
+bool lcl_isNextGroup(OString &sGroup_out, std::string_view sLineTrim)
+{
+    const bool bBracketed
+        = o3tl::starts_with(sLineTrim, "[") && o3tl::ends_with(sLineTrim, "]");
+    if (!bBracketed)
+        return false;
+
+    // Take what follows the first '[' and cut it at the first ']'
+    const std::string_view sAfterOpen = o3tl::getToken(sLineTrim, 1, '[');
+    const std::string_view sName = o3tl::getToken(sAfterOpen, 0, ']');
+    sGroup_out = OString(o3tl::trim(sName));
+    return true;
+}
+
+// Strips the three bytes EF BB BF from the front of rString when present;
+// any other string is left unchanged.
+void lcl_RemoveUTF8ByteOrderMarker( OString &rString )
+{
+    const bool bHasBOM = rString.getLength() >= 3
+        && rString[0] == '\xEF'
+        && rString[1] == '\xBB'
+        && rString[2] == '\xBF';
+    if( !bHasBOM )
+        return;
+
+    rString = rString.copy(3);
+}
+
+}
+
+
+
+// Loads the file named by sLngFile line by line into mvLines.
+//
+// If the file cannot be opened, mvLines stays empty. Otherwise every line is
+// stored (a UTF-8 byte order mark on the first line is removed) and one empty
+// line is appended after the last line read.
+LngParser::LngParser(OString sLngFile)
+    : sSource(std::move( sLngFile ))
+{
+    std::ifstream aStream(sSource.getStr());
+    if (!aStream.is_open())
+        return;
+
+    bool bFirstLine = true;
+    std::string s;
+    // Loop on the result of getline() instead of testing eof():
+    //  - a last line without a trailing newline sets eofbit while still
+    //    delivering data, and must not be dropped;
+    //  - a stream that fails without ever reaching EOF must end the loop.
+    while (std::getline(aStream, s))
+    {
+        OString sLine(s.data(), s.length());
+
+        if( bFirstLine )
+        {
+            // Always remove UTF8 BOM from the first line
+            lcl_RemoveUTF8ByteOrderMarker( sLine );
+            bFirstLine = false;
+        }
+
+        mvLines.push_back( sLine );
+    }
+    // Always finish with an empty line (presumably the terminator the group
+    // scanners in CreatePO/Merge rely on -- confirm before removing)
+    mvLines.push_back( OString() );
+}
+
+// No explicit cleanup is performed on destruction.
+LngParser::~LngParser() = default;
+
+// Walks over the loaded lines and writes one PO entry per group to rPOFile,
+// which is opened with PoOfstream::APP.
+//
+// If the PO file cannot be opened an error is printed to std::cerr and
+// nothing else is done.
+void LngParser::CreatePO( const OString &rPOFile )
+{
+    PoOfstream aPOStream( rPOFile, PoOfstream::APP );
+    if (!aPOStream.isOpen()) {
+        std::cerr << "Ulfex error: Can't open po file:" << rPOFile << "\n";
+        // Without an open stream there is nothing to write to (or close)
+        return;
+    }
+
+    size_t nPos  = 0;
+    bool bStart = true;
+    OString sGroup, sLine;
+    OStringHashMap Text;
+    OString sID;
+
+    while( nPos < mvLines.size() ) {
+        sLine = mvLines[ nPos++ ];
+        // Collect "key = value" lines until the next "[group]" header shows
+        // up or the lines run out. isNextGroup() overwrites sGroup only when
+        // it finds a header, so sID keeps naming the group being collected.
+        while( nPos < mvLines.size() && !isNextGroup( sGroup , sLine ) ) {
+            ReadLine( sLine , Text );
+            sID = sGroup;
+            sLine = mvLines[ nPos++ ];
+        }
+        if( bStart ) {
+            // First stop: no group has been collected yet, nothing to write
+            bStart = false;
+            sID = sGroup;
+        }
+        else {
+            WritePO( aPOStream , Text , sSource , sID );
+        }
+        // Only the comment is reset between groups
+        Text.erase("x-comment"_ostr);
+    }
+    aPOStream.close();
+}
+
+// Emits one PO entry through common::writePoEntry for the group rID.
+// The "x-comment" value (empty when absent) and the "en-US" value of
+// rText_inout are passed as the last two arguments. Looking up "en-US" goes
+// through operator[], so a missing key is added with an empty value.
+void LngParser::WritePO(PoOfstream &aPOStream,
+    OStringHashMap &rText_inout, const OString &rActFileName,
+    const OString &rID)
+{
+    const auto aCommentIt = rText_inout.find("x-comment"_ostr);
+    const OString sComment
+        = aCommentIt != rText_inout.end() ? aCommentIt->second : OString();
+
+    common::writePoEntry(
+        "Ulfex"_ostr, aPOStream, rActFileName, "LngText",
+        rID, OString(), sComment, rText_inout["en-US"_ostr]);
+}
+
+// Trims sLine_in and reports whether it is a "[group]" header; on success
+// the group name is stored in sGroup_out.
+bool LngParser::isNextGroup(OString &sGroup_out, std::string_view sLine_in)
+{
+    const std::string_view sTrimmed = o3tl::trim(sLine_in);
+    return lcl_isNextGroup(sGroup_out, sTrimmed);
+}
+
+// Parses one line and records it in rText_inout.
+// Lines starting with " *" or "/*" are ignored. For any other line the
+// trimmed text before the first '=' is the key; when that key is not empty
+// the text between the first pair of double quotes is stored under it.
+void LngParser::ReadLine(std::string_view rLine_in,
+        OStringHashMap &rText_inout)
+{
+    const bool bCommentLine
+        = o3tl::starts_with(rLine_in, " *") || o3tl::starts_with(rLine_in, "/*");
+    if (bCommentLine)
+        return;
+
+    const OString sKey(o3tl::trim(o3tl::getToken(rLine_in, 0, '=')));
+    if (sKey.isEmpty())
+        return;
+
+    rText_inout[sKey] = OString(o3tl::getToken(rLine_in,1, '"'));
+}
+
+// Merges the translations from rPOFile into the loaded lines and writes the
+// result to rDestinationFile (the file is truncated).
+//
+// rLanguage: when it equals "ALL" (ASCII case-insensitive) aLanguages is
+// replaced by the languages of the merge data file; otherwise it is left
+// unchanged.
+//
+// For every "[group]" section:
+//  - each "lang = ..." line is rewritten with the merged text when there is
+//    one ("qtz" lines are never rewritten);
+//  - a second line for a language already seen in the group is removed;
+//  - languages from aLanguages without a text yet get a new line inserted
+//    after the last language line of the group.
+void LngParser::Merge(
+    const OString &rPOFile,
+    const OString &rDestinationFile,
+    std::string_view rLanguage )
+{
+    std::ofstream aDestination(
+        rDestinationFile.getStr(), std::ios_base::out | std::ios_base::trunc);
+
+    MergeDataFile aMergeDataFile( rPOFile, sSource, false, true );
+    if( o3tl::equalsIgnoreAsciiCase(rLanguage, "ALL") )
+        aLanguages = aMergeDataFile.GetLanguages();
+
+    size_t nPos = 0;
+    bool bGroup = false;
+    OString sGroup;
+
+    // seek to next group
+    while ( nPos < mvLines.size() && !bGroup )
+        bGroup = lcl_isNextGroup(sGroup, o3tl::trim(mvLines[nPos++]));
+
+    while ( nPos < mvLines.size()) {
+        OStringHashMap Text;
+        OString sID( sGroup );
+        std::size_t nLastLangPos = 0;
+
+        ResData aResData( sID, sSource );
+        aResData.sResTyp = "LngText"_ostr;
+        MergeEntrys *pEntrys = aMergeDataFile.GetMergeEntrys( &aResData );
+        // read languages
+        bGroup = false;
+
+        // ";lang;" markers of the languages already handled in this group
+        OString sLanguagesDone;
+
+        while ( nPos < mvLines.size() && !bGroup )
+        {
+            const OString sLine{ mvLines[nPos].trim() };
+            if ( lcl_isNextGroup(sGroup, sLine) )
+            {
+                bGroup = true;
+                nPos ++;
+                sLanguagesDone = ""_ostr;
+            }
+            else
+            {
+                sal_Int32 n = 0;
+                OString sLang(sLine.getToken(0, '=', n));
+                // n == -1: the line has no '=', so it is not a language line
+                if (n == -1 || static_cast<bool>(sLine.match("/*")))
+                {
+                    ++nPos;
+                }
+                else
+                {
+                    sLang = sLang.trim();
+
+                    OString sSearch{ ";" + sLang + ";" };
+
+                    if ( sLanguagesDone.indexOf( sSearch ) != -1 ) {
+                        // Duplicate language line: drop it and look at the
+                        // line that moved into this slot. Carrying on here
+                        // would apply this language to that unrelated line.
+                        mvLines.erase( mvLines.begin() + nPos );
+                        continue;
+                    }
+                    if( pEntrys && !sLang.isEmpty() )
+                    {
+                        OString sNewText;
+                        pEntrys->GetText( sNewText, sLang, true );
+
+                        // "qtz" lines stay as they are, but the position
+                        // below must still advance or this loop would
+                        // never leave the line.
+                        if ( sLang != "qtz" && !sNewText.isEmpty()) {
+                            mvLines[ nPos ] = sLang
+                                + " = \""
+                                // escape quotes, unescape double escaped quotes fdo#56648
+                                + sNewText.replaceAll("\""_ostr,"\\\""_ostr).replaceAll("\\\\\""_ostr,"\\\""_ostr)
+                                + "\"";
+                            Text[ sLang ] = sNewText;
+                        }
+                    }
+                    nLastLangPos = nPos;
+                    nPos ++;
+                    sLanguagesDone += sSearch;
+                }
+            }
+        }
+        OString sCur;
+        // Add lines for languages that have a translation but no line yet
+        if ( nLastLangPos )
+        {
+            for(size_t n = 0; n < aLanguages.size(); ++n)
+            {
+                sCur = aLanguages[ n ];
+                if( !sCur.equalsIgnoreAsciiCase("en-US") && Text[sCur].isEmpty() && pEntrys )
+                {
+
+                    OString sNewText;
+                    pEntrys->GetText( sNewText, sCur, true );
+                    if( sCur == "qtz" )
+                        continue;
+                    if ( !sNewText.isEmpty() && sCur != "x-comment")
+                    {
+                        const OString sLine { sCur
+                            + " = \""
+                            // escape quotes, unescape double escaped quotes fdo#56648
+                            + sNewText.replaceAll("\""_ostr,"\\\""_ostr).replaceAll("\\\\\""_ostr,"\\\""_ostr)
+                            + "\"" };
+
+                        // The new line goes right behind the last language
+                        // line; nPos moves along because everything after
+                        // the insertion point shifts by one.
+                        nLastLangPos++;
+                        nPos++;
+
+                        if ( nLastLangPos < mvLines.size() ) {
+                            mvLines.insert( mvLines.begin() + nLastLangPos, sLine );
+                        } else {
+                            mvLines.push_back( sLine );
+                        }
+                    }
+                }
+            }
+        }
+    }
+
+    for ( size_t i = 0; i < mvLines.size(); ++i )
+        aDestination << mvLines[i] << '\n';
+
+    aDestination.close();
+}
+
+/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
author	Daniel Baumann <daniel.baumann@progress-linux.org>	2024-04-15 05:54:39 +0000
committer	Daniel Baumann <daniel.baumann@progress-linux.org>	2024-04-15 05:54:39 +0000
commit	267c6f2ac71f92999e969232431ba04678e7437e (patch)
tree	358c9467650e1d0a1d7227a21dac2e3d08b622b2 /l10ntools/source/lngmerge.cxx
parent	Initial commit. (diff)
download	libreoffice-267c6f2ac71f92999e969232431ba04678e7437e.tar.xz libreoffice-267c6f2ac71f92999e969232431ba04678e7437e.zip