summaryrefslogtreecommitdiffstats
path: root/sw/source/ui/uno/swdetect.cxx
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-07 09:06:44 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-07 09:06:44 +0000
commited5640d8b587fbcfed7dd7967f3de04b37a76f26 (patch)
tree7a5f7c6c9d02226d7471cb3cc8fbbf631b415303 /sw/source/ui/uno/swdetect.cxx
parentInitial commit. (diff)
downloadlibreoffice-upstream.tar.xz
libreoffice-upstream.zip
Adding upstream version 4:7.4.7.upstream/4%7.4.7upstream
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'sw/source/ui/uno/swdetect.cxx')
-rw-r--r--sw/source/ui/uno/swdetect.cxx171
1 files changed, 171 insertions, 0 deletions
diff --git a/sw/source/ui/uno/swdetect.cxx b/sw/source/ui/uno/swdetect.cxx
new file mode 100644
index 000000000..83b7162ae
--- /dev/null
+++ b/sw/source/ui/uno/swdetect.cxx
@@ -0,0 +1,171 @@
+/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
+/*
+ * This file is part of the LibreOffice project.
+ *
+ * This Source Code Form is subject to the terms of the Mozilla Public
+ * License, v. 2.0. If a copy of the MPL was not distributed with this
+ * file, You can obtain one at http://mozilla.org/MPL/2.0/.
+ *
+ * This file incorporates work covered by the following license notice:
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed
+ * with this work for additional information regarding copyright
+ * ownership. The ASF licenses this file to you under the Apache
+ * License, Version 2.0 (the "License"); you may not use this file
+ * except in compliance with the License. You may obtain a copy of
+ * the License at http://www.apache.org/licenses/LICENSE-2.0 .
+ */
+
+#include "swdetect.hxx"
+
+#include <cppuhelper/supportsservice.hxx>
+#include <com/sun/star/io/XInputStream.hpp>
+#include <com/sun/star/uno/XComponentContext.hpp>
+#include <sfx2/docfile.hxx>
+#include <sot/storage.hxx>
+#include <tools/urlobj.hxx>
+#include <unotools/mediadescriptor.hxx>
+
+using namespace ::com::sun::star;
+using namespace ::com::sun::star::uno;
+using namespace ::com::sun::star::io;
+using namespace ::com::sun::star::task;
+using namespace ::com::sun::star::beans;
+using namespace ::com::sun::star::lang;
+using utl::MediaDescriptor;
+
+/** Constructs the detector; no explicit initialisation is performed here. */
+SwFilterDetect::SwFilterDetect() = default;
+
+/** Destroys the detector; no explicit clean-up is performed here. */
+SwFilterDetect::~SwFilterDetect() = default;
+
+/**
+ * Checks whether the content of the input stream matches the type name that is
+ * already present in the media descriptor.
+ *
+ * Depending on the incoming type name one of three checks is run:
+ *  - "writer_Rich_Text_Format": the first five bytes must be "{\rtf".
+ *  - "writer_MS_WinWord_5": the first three bytes must match one of the
+ *    single-stream Word signatures listed below.
+ *  - any other type name: the stream must open as a storage that contains a
+ *    "WordDocument" stream. Type names starting with "writer_MS_Word_97"
+ *    additionally need a "0Table" or "1Table" stream, and for
+ *    "writer_MS_Word_97_Vorlage" the file must either be named *.dot or have the
+ *    fDot bit set in the "WordDocument" stream.
+ *
+ * @param lDescriptor media descriptor; its type name, input stream and URL
+ *                    entries are read.
+ * @return the incoming type name if the content matches it, otherwise an empty
+ *         string (also returned when there is no usable input stream).
+ */
+OUString SAL_CALL SwFilterDetect::detect( Sequence< PropertyValue >& lDescriptor )
+{
+    MediaDescriptor aMediaDesc( lDescriptor );
+    OUString aTypeName = aMediaDesc.getUnpackedValueOrDefault( MediaDescriptor::PROP_TYPENAME, OUString() );
+    uno::Reference< io::XInputStream > xInStream ( aMediaDesc[MediaDescriptor::PROP_INPUTSTREAM], uno::UNO_QUERY );
+    if ( !xInStream.is() )
+        return OUString();
+
+    // Wrap the UNO stream in a medium to get SvStream access; detection must
+    // not trigger any user interaction.
+    SfxMedium aMedium;
+    aMedium.UseInteractionHandler( false );
+    aMedium.setStreamToLoadFrom( xInStream, true );
+
+    SvStream *pInStrm = aMedium.GetInStream();
+    if ( !pInStrm || pInStrm->GetError() )
+        return OUString();
+
+    bool bIsDetected = false;
+
+    if ( aTypeName == "writer_Rich_Text_Format" )
+    {
+        pInStrm->Seek( STREAM_SEEK_TO_BEGIN );
+        bIsDetected = ( read_uInt8s_ToOString( *pInStrm, 5 ) == "{\\rtf" );
+    }
+    else if ( aTypeName == "writer_MS_WinWord_5" )
+    {
+        pInStrm->Seek( STREAM_SEEK_TO_BEGIN );
+        const sal_uInt8 nBufSize = 3;
+        sal_uInt8 nBuffer[ nBufSize ];
+        // Fewer than three bytes available: cannot be any of the signatures.
+        if (pInStrm->ReadBytes(nBuffer, nBufSize) < nBufSize)
+            return OUString();
+
+        bIsDetected = (nBuffer[0] == 0x9B && nBuffer[1] == 0xA5 && nBuffer[2] == 0x21) // WinWord 1
+                   || (nBuffer[0] == 0x9C && nBuffer[1] == 0xA5 && nBuffer[2] == 0x21) // PMWord 1
+                   || (nBuffer[0] == 0xDB && nBuffer[1] == 0xA5 && nBuffer[2] == 0x2D) // WinWord 2
+                   || (nBuffer[0] == 0xDC && nBuffer[1] == 0xA5 && nBuffer[2] == 0x65); // WinWord 6.0/95, as a single stream file
+    }
+    else
+    {
+        // Do not attempt to create an SotStorage on a
+        // 0-length stream as that would create the compound
+        // document header on the stream and effectively write to
+        // disk!
+        pInStrm->Seek( STREAM_SEEK_TO_BEGIN );
+        if ( pInStrm->remainingSize() == 0 )
+            return OUString();
+
+        try
+        {
+            tools::SvRef<SotStorage> aStorage = new SotStorage ( pInStrm, false );
+            if ( !aStorage->GetError() )
+            {
+                bIsDetected = aStorage->IsContained( "WordDocument" );
+                if ( bIsDetected && aTypeName.startsWith( "writer_MS_Word_97" ) )
+                {
+                    bIsDetected = ( aStorage->IsContained("0Table") || aStorage->IsContained("1Table") );
+
+                    // If we are checking the template type, and the document is not a .dot, don't
+                    // mis-detect it.
+                    if ( bIsDetected && aTypeName == "writer_MS_Word_97_Vorlage" )
+                    {
+                        // It is common practice to rename a .doc to .dot to make it a template.
+                        // Since we have detected a .doc-ish format, always accept .dot-named files
+                        // as valid templates to avoid flagging this as an invalid .dot format.
+                        INetURLObject aParser(aMediaDesc.getUnpackedValueOrDefault(
+                            utl::MediaDescriptor::PROP_URL, OUString()));
+
+                        // Super ugly hack, but we don't want to use the whole WW8Fib thing here in
+                        // the swd library, apparently. We know (do we?) that the "aBits1" byte, as
+                        // the variable is called in WW8Fib::WW8Fib(SvStream&,sal_uInt8,sal_uInt32),
+                        // is at offset 10 in the WordDocument stream. The fDot bit is bit 0x01 of
+                        // that byte.
+                        if (aParser.getExtension().toAsciiLowerCase() != "dot")
+                        {
+                            tools::SvRef<SotStorageStream> xWordDocument
+                                = aStorage->OpenSotStream("WordDocument", StreamMode::STD_READ);
+                            xWordDocument->Seek(10);
+                            if (xWordDocument->Tell() == 10)
+                            {
+                                // Start from 0 so that a failed read (e.g. the stream ends
+                                // exactly at offset 10) is treated as "fDot not set" instead
+                                // of evaluating an indeterminate value.
+                                sal_uInt8 aBits1 = 0;
+                                xWordDocument->ReadUChar(aBits1);
+                                // Check fDot bit
+                                bIsDetected = ((aBits1 & 0x01) == 0x01);
+                            }
+                        }
+                    }
+                }
+            }
+        }
+        catch (...)
+        {
+            // Any failure while probing the storage simply means "not this format".
+            bIsDetected = false;
+        }
+    }
+
+    if ( bIsDetected )
+        return aTypeName;
+
+    return OUString();
+}
+
+/* XServiceInfo: name under which this implementation identifies itself */
+OUString SAL_CALL SwFilterDetect::getImplementationName()
+{
+    OUString aImplementationName( "com.sun.star.comp.writer.FormatDetector" );
+    return aImplementationName;
+}
+
+/* XServiceInfo: the lookup is delegated to the cppu::supportsService helper */
+sal_Bool SAL_CALL SwFilterDetect::supportsService( const OUString& sServiceName )
+{
+    const bool bSupported = cppu::supportsService( this, sServiceName );
+    return bSupported;
+}
+
+/* XServiceInfo: the three service names this implementation reports */
+Sequence< OUString > SAL_CALL SwFilterDetect::getSupportedServiceNames()
+{
+    Sequence< OUString > aServiceNames{
+        "com.sun.star.frame.ExtendedTypeDetection",
+        "com.sun.star.text.FormatDetector",
+        "com.sun.star.text.W4WFormatDetector"
+    };
+    return aServiceNames;
+}
+
+/**
+ * Exported C entry point that creates a new SwFilterDetect instance.
+ *
+ * Both arguments (component context and argument sequence) are unused. The
+ * new object is handed to cppu::acquire() and the resulting interface pointer
+ * is returned to the caller.
+ */
+extern "C" SAL_DLLPUBLIC_EXPORT css::uno::XInterface*
+com_sun_star_comp_writer_FormatDetector_get_implementation(css::uno::XComponentContext*,
+                                                           css::uno::Sequence<css::uno::Any> const &)
+{
+    SwFilterDetect* pDetector = new SwFilterDetect();
+    return cppu::acquire(pDetector);
+}
+
+/* vim:set shiftwidth=4 softtabstop=4 expandtab: */