1
0
Fork 0
libreoffice/sw/source/ui/uno/swdetect.cxx
Daniel Baumann 8e63e14cf6
Adding upstream version 4:25.2.3.
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
2025-06-22 16:20:04 +02:00

171 lines
6.7 KiB
C++

/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
/*
* This file is part of the LibreOffice project.
*
* This Source Code Form is subject to the terms of the Mozilla Public
* License, v. 2.0. If a copy of the MPL was not distributed with this
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
*
* This file incorporates work covered by the following license notice:
*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed
* with this work for additional information regarding copyright
* ownership. The ASF licenses this file to you under the Apache
* License, Version 2.0 (the "License"); you may not use this file
* except in compliance with the License. You may obtain a copy of
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
*/
#include "swdetect.hxx"
#include <cppuhelper/supportsservice.hxx>
#include <com/sun/star/io/XInputStream.hpp>
#include <com/sun/star/uno/XComponentContext.hpp>
#include <sfx2/docfile.hxx>
#include <sot/storage.hxx>
#include <tools/urlobj.hxx>
#include <unotools/mediadescriptor.hxx>
using namespace ::com::sun::star;
using namespace ::com::sun::star::uno;
using namespace ::com::sun::star::io;
using namespace ::com::sun::star::task;
using namespace ::com::sun::star::beans;
using namespace ::com::sun::star::lang;
using utl::MediaDescriptor;
SwFilterDetect::SwFilterDetect()
{
}
SwFilterDetect::~SwFilterDetect()
{
}
OUString SAL_CALL SwFilterDetect::detect( Sequence< PropertyValue >& lDescriptor )
{
MediaDescriptor aMediaDesc( lDescriptor );
OUString aTypeName = aMediaDesc.getUnpackedValueOrDefault( MediaDescriptor::PROP_TYPENAME, OUString() );
uno::Reference< io::XInputStream > xInStream ( aMediaDesc[MediaDescriptor::PROP_INPUTSTREAM], uno::UNO_QUERY );
if ( !xInStream.is() )
return OUString();
SfxMedium aMedium;
aMedium.UseInteractionHandler( false );
aMedium.setStreamToLoadFrom( xInStream, true );
SvStream *pInStrm = aMedium.GetInStream();
if ( !pInStrm || pInStrm->GetError() )
return OUString();
bool bIsDetected = false;
if ( aTypeName == "writer_Rich_Text_Format" )
{
pInStrm->Seek( STREAM_SEEK_TO_BEGIN );
bIsDetected = ( read_uInt8s_ToOString( *pInStrm, 5 ) == "{\\rtf" );
}
else if ( aTypeName == "writer_MS_WinWord_5" )
{
pInStrm->Seek( STREAM_SEEK_TO_BEGIN );
const sal_uInt8 nBufSize = 3;
sal_uInt8 nBuffer[ nBufSize ];
if (pInStrm->ReadBytes(nBuffer, nBufSize) < nBufSize)
return OUString();
bIsDetected = (nBuffer[0] == 0x9B && nBuffer[1] == 0xA5 && nBuffer[2] == 0x21) // WinWord 1
|| (nBuffer[0] == 0x9C && nBuffer[1] == 0xA5 && nBuffer[2] == 0x21) // PMWord 1
|| (nBuffer[0] == 0xDB && nBuffer[1] == 0xA5 && nBuffer[2] == 0x2D) // WinWord 2
|| (nBuffer[0] == 0xDC && nBuffer[1] == 0xA5 && nBuffer[2] == 0x65); // WinWord 6.0/95, as a single stream file
}
else
{
// Do not attempt to create an SotStorage on a
// 0-length stream as that would create the compound
// document header on the stream and effectively write to
// disk!
pInStrm->Seek( STREAM_SEEK_TO_BEGIN );
if ( pInStrm->remainingSize() == 0 )
return OUString();
try
{
rtl::Reference<SotStorage> aStorage = new SotStorage ( pInStrm, false );
if ( !aStorage->GetError() )
{
bIsDetected = aStorage->IsContained( u"WordDocument"_ustr );
if ( bIsDetected && aTypeName.startsWith( "writer_MS_Word_97" ) )
{
bIsDetected = ( aStorage->IsContained(u"0Table"_ustr) || aStorage->IsContained(u"1Table"_ustr) );
// If we are checking the template type, and the document is not a .dot, don't
// mis-detect it.
if ( bIsDetected && aTypeName == "writer_MS_Word_97_Vorlage" )
{
// It is common practice to rename a .doc to .dot to make it a template.
// Since we have detected a.doc-ish format, always accept .dot-named-files
// as valid templates to avoid flagging this as an invalid .dot format..
INetURLObject aParser(aMediaDesc.getUnpackedValueOrDefault(
utl::MediaDescriptor::PROP_URL, OUString()));
// Super ugly hack, but we don't want to use the whole WW8Fib thing here in
// the swd library, apparently. We know (do we?) that the "aBits1" byte, as
// the variable is called in WW8Fib::WW8Fib(SvStream&,sal_uInt8,sal_uInt32),
// is at offset 10 in the WordDocument stream. The fDot bit is bit 0x01 of
// that byte.
if (aParser.getExtension().toAsciiLowerCase() != "dot")
{
rtl::Reference<SotStorageStream> xWordDocument
= aStorage->OpenSotStream(u"WordDocument"_ustr, StreamMode::STD_READ);
xWordDocument->Seek(10);
if (xWordDocument->Tell() == 10)
{
sal_uInt8 aBits1;
xWordDocument->ReadUChar(aBits1);
// Check fDot bit
bIsDetected = ((aBits1 & 0x01) == 0x01);
}
}
}
}
}
}
catch (...)
{
bIsDetected = false;
}
}
if ( bIsDetected )
return aTypeName;
return OUString();
}
/* XServiceInfo */
OUString SAL_CALL SwFilterDetect::getImplementationName()
{
return u"com.sun.star.comp.writer.FormatDetector"_ustr;
}
/* XServiceInfo */
sal_Bool SAL_CALL SwFilterDetect::supportsService( const OUString& sServiceName )
{
return cppu::supportsService(this, sServiceName);
}
/* XServiceInfo */
Sequence< OUString > SAL_CALL SwFilterDetect::getSupportedServiceNames()
{
return { u"com.sun.star.frame.ExtendedTypeDetection"_ustr, u"com.sun.star.text.FormatDetector"_ustr, u"com.sun.star.text.W4WFormatDetector"_ustr };
}
extern "C" SAL_DLLPUBLIC_EXPORT css::uno::XInterface*
com_sun_star_comp_writer_FormatDetector_get_implementation(css::uno::XComponentContext*,
css::uno::Sequence<css::uno::Any> const &)
{
return cppu::acquire(new SwFilterDetect());
}
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */