From ed5640d8b587fbcfed7dd7967f3de04b37a76f26 Mon Sep 17 00:00:00 2001 From: Daniel Baumann Date: Sun, 7 Apr 2024 11:06:44 +0200 Subject: Adding upstream version 4:7.4.7. Signed-off-by: Daniel Baumann --- sdext/source/pdfimport/test/tests.cxx | 904 ++++++++++++++++++++++++++++++++++ 1 file changed, 904 insertions(+) create mode 100644 sdext/source/pdfimport/test/tests.cxx (limited to 'sdext/source/pdfimport/test/tests.cxx') diff --git a/sdext/source/pdfimport/test/tests.cxx b/sdext/source/pdfimport/test/tests.cxx new file mode 100644 index 000000000..b569a1443 --- /dev/null +++ b/sdext/source/pdfimport/test/tests.cxx @@ -0,0 +1,904 @@ +/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */ +/* + * This file is part of the LibreOffice project. + * + * This Source Code Form is subject to the terms of the Mozilla Public + * License, v. 2.0. If a copy of the MPL was not distributed with this + * file, You can obtain one at http://mozilla.org/MPL/2.0/. + * + * This file incorporates work covered by the following license notice: + * + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed + * with this work for additional information regarding copyright + * ownership. The ASF licenses this file to you under the Apache + * License, Version 2.0 (the "License"); you may not use this file + * except in compliance with the License. You may obtain a copy of + * the License at http://www.apache.org/licenses/LICENSE-2.0 . + */ + +#include + +#include "outputwrap.hxx" +#include +#include +#include +#include +#include "../pdfiadaptor.hxx" + +#include +#include +#include +#include + +#include +#include +#include +#include +#include + +#include +#include +#include +#include +#include + +#include +#include +#include +#include + +#include +#include + +#include +#include + +using namespace ::pdfparse; +using namespace ::pdfi; +using namespace ::com::sun::star; + +namespace +{ + + class TestSink : public ContentSink + { + public: + TestSink() : + m_nNextFontId( 1 ), + m_aIdToFont(), + m_aFontToId(), + m_aGCStack(1), + m_aPageSize(), + m_aHyperlinkBounds(), + m_aURI(), + m_aTextOut(), + m_nNumPages(0), + m_bPageEnded(false), + m_bRedCircleSeen(false), + m_bGreenStrokeSeen(false), + m_bDashedLineSeen(false), + m_bImageSeen(false) + {} + + void check() + { + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "A4 page size (in 100th of points): Width", 79400, m_aPageSize.Width, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "A4 page size (in 100th of points): Height", 59500, m_aPageSize.Height, 0.0000001 ); + CPPUNIT_ASSERT_MESSAGE( "endPage() called", m_bPageEnded ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Num pages equal one", sal_Int32(1), m_nNumPages ); + CPPUNIT_ASSERT_MESSAGE( "Correct hyperlink bounding box", + rtl::math::approxEqual(m_aHyperlinkBounds.X1,34.7 ) ); + CPPUNIT_ASSERT_MESSAGE( "Correct hyperlink bounding box", + rtl::math::approxEqual(m_aHyperlinkBounds.Y1,386.0) ); + CPPUNIT_ASSERT_MESSAGE( "Correct hyperlink bounding box", + rtl::math::approxEqual(m_aHyperlinkBounds.X2,166.7) ); + CPPUNIT_ASSERT_MESSAGE( "Correct hyperlink bounding box", + rtl::math::approxEqual(m_aHyperlinkBounds.Y2,406.2) ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Correct hyperlink URI", OUString("http://download.openoffice.org/"), m_aURI ); + + const char* const sText = " \n \nThis is a testtext\nNew paragraph,\nnew line\n" + "Hyperlink, this is\n?\nThis is more text\noutline mode\n?\nNew paragraph\n"; + OString aTmp; + m_aTextOut.makeStringAndClear().convertToString( &aTmp, + RTL_TEXTENCODING_ASCII_US, + OUSTRING_TO_OSTRING_CVTFLAGS ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Imported text is \"This is a testtext New paragraph, new line" + " Hyperlink, this is * This is more text outline mode * New paragraph\"", + aTmp, OString(sText) ); + + CPPUNIT_ASSERT_MESSAGE( "red circle seen in input", m_bRedCircleSeen ); + CPPUNIT_ASSERT_MESSAGE( "green stroke seen in input", m_bGreenStrokeSeen ); + CPPUNIT_ASSERT_MESSAGE( "dashed line seen in input", m_bDashedLineSeen ); + CPPUNIT_ASSERT_MESSAGE( "image seen in input", m_bImageSeen ); + } + + private: + GraphicsContext& getCurrentContext() { return m_aGCStack.back(); } + + // ContentSink interface implementation + virtual void setPageNum( sal_Int32 nNumPages ) override + { + m_nNumPages = nNumPages; + } + + virtual void startPage( const geometry::RealSize2D& rSize ) override + { + m_aPageSize = rSize; + } + + virtual void endPage() override + { + m_bPageEnded = true; + } + + virtual void hyperLink( const geometry::RealRectangle2D& rBounds, + const OUString& rURI ) override + { + m_aHyperlinkBounds = rBounds; + m_aURI = rURI; + } + + virtual void pushState() override + { + GraphicsContextStack::value_type const a(m_aGCStack.back()); + m_aGCStack.push_back(a); + } + + virtual void popState() override + { + m_aGCStack.pop_back(); + } + + virtual void setTransformation( const geometry::AffineMatrix2D& rMatrix ) override + { + basegfx::unotools::homMatrixFromAffineMatrix( + getCurrentContext().Transformation, + rMatrix ); + } + + virtual void setLineDash( const uno::Sequence& dashes, + double start ) override + { + GraphicsContext& rContext( getCurrentContext() ); + if( dashes.hasElements() ) + comphelper::sequenceToContainer(rContext.DashArray,dashes); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "line dashing start offset", 0.0, start, 0.000000001 ); + } + + virtual void setFlatness( double nFlatness ) override + { + getCurrentContext().Flatness = nFlatness; + } + + virtual void setLineJoin(sal_Int8 nJoin) override + { + getCurrentContext().LineJoin = nJoin; + } + + virtual void setLineCap(sal_Int8 nCap) override + { + getCurrentContext().LineCap = nCap; + } + + virtual void setMiterLimit(double nVal) override + { + getCurrentContext().MiterLimit = nVal; + } + + virtual void setLineWidth(double nVal) override + { + getCurrentContext().LineWidth = nVal; + } + + virtual void setFillColor( const rendering::ARGBColor& rColor ) override + { + getCurrentContext().FillColor = rColor; + } + + virtual void setStrokeColor( const rendering::ARGBColor& rColor ) override + { + getCurrentContext().LineColor = rColor; + } + + virtual void setFont( const FontAttributes& rFont ) override + { + FontToIdMap::const_iterator it = m_aFontToId.find( rFont ); + if( it != m_aFontToId.end() ) + getCurrentContext().FontId = it->second; + else + { + m_aFontToId[ rFont ] = m_nNextFontId; + m_aIdToFont[ m_nNextFontId ] = rFont; + getCurrentContext().FontId = m_nNextFontId; + m_nNextFontId++; + } + } + + virtual void strokePath( const uno::Reference& rPath ) override + { + GraphicsContext& rContext( getCurrentContext() ); + basegfx::B2DPolyPolygon aPath = basegfx::unotools::b2DPolyPolygonFromXPolyPolygon2D(rPath); + aPath.transform( rContext.Transformation ); + + if( rContext.DashArray.empty() ) + { + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is green", 1.0, rContext.LineColor.Alpha, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is green", 0.0, rContext.LineColor.Blue, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is green", 1.0, rContext.LineColor.Green, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is green", 0.0, rContext.LineColor.Red, 0.00000001); + + CPPUNIT_ASSERT_MESSAGE( "Line width is 0", + rtl::math::approxEqual(rContext.LineWidth, 28.3) ); + + static constexpr OUStringLiteral sExportString = u"m53570 7650-35430 24100"; + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Stroke is m535.7 518.5-354.3-241", + OUString(sExportString), basegfx::utils::exportToSvgD( aPath, true, true, false ) ); + + m_bGreenStrokeSeen = true; + } + else + { + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Dash array consists of four entries", std::vector::size_type(4), rContext.DashArray.size()); + CPPUNIT_ASSERT_DOUBLES_EQUAL( 14.3764, rContext.DashArray[0], 1E-12 ); + CPPUNIT_ASSERT_DOUBLES_EQUAL( rContext.DashArray[0], rContext.DashArray[1], 1E-12 ); + CPPUNIT_ASSERT_DOUBLES_EQUAL( rContext.DashArray[1], rContext.DashArray[2], 1E-12 ); + CPPUNIT_ASSERT_DOUBLES_EQUAL( rContext.DashArray[2], rContext.DashArray[3], 1E-12 ); + + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is black", 1.0, rContext.LineColor.Alpha, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is black", 0.0, rContext.LineColor.Blue, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is black", 0.0, rContext.LineColor.Green, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is black", 0.0, rContext.LineColor.Red, 0.00000001); + + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line width is 0", + 0, rContext.LineWidth, 0.0000001 ); + + static constexpr OUStringLiteral sExportString = u"m49890 5670.00000000001-35430 24090"; + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Stroke is m49890 5670.00000000001-35430 24090", + OUString(sExportString), basegfx::utils::exportToSvgD( aPath, true, true, false ) ); + + m_bDashedLineSeen = true; + } + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Blend mode is normal", + rendering::BlendMode::NORMAL, rContext.BlendMode ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Join type is round", + rendering::PathJoinType::ROUND, rContext.LineJoin ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Cap type is butt", + rendering::PathCapType::BUTT, rContext.LineCap ); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line miter limit is 10", + 10, rContext.MiterLimit, 0.0000001 ); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Flatness is 0", + 1, rContext.Flatness, 0.00000001 ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Font id is 0", + sal_Int32(0), rContext.FontId ); + } + + virtual void fillPath( const uno::Reference& rPath ) override + { + GraphicsContext& rContext( getCurrentContext() ); + basegfx::B2DPolyPolygon aPath = basegfx::unotools::b2DPolyPolygonFromXPolyPolygon2D(rPath); + aPath.transform( rContext.Transformation ); + + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is black", 1.0, rContext.LineColor.Alpha, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is black", 0.0, rContext.LineColor.Blue, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is black", 0.0, rContext.LineColor.Green, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is black", 0.0, rContext.LineColor.Red, 0.00000001); + + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Blend mode is normal", + rendering::BlendMode::NORMAL, rContext.BlendMode ); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Flatness is 10", + 10, rContext.Flatness, 0.00000001 ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Font id is 0", + sal_Int32(0), rContext.FontId ); + } + + virtual void eoFillPath( const uno::Reference& rPath ) override + { + GraphicsContext& rContext( getCurrentContext() ); + basegfx::B2DPolyPolygon aPath = basegfx::unotools::b2DPolyPolygonFromXPolyPolygon2D(rPath); + aPath.transform( rContext.Transformation ); + + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is black", 1.0, rContext.LineColor.Alpha, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is black", 0.0, rContext.LineColor.Blue, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is black", 0.0, rContext.LineColor.Green, 0.00000001); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Line color is black", 0.0, rContext.LineColor.Red, 0.00000001); + + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Blend mode is normal", + rendering::BlendMode::NORMAL, rContext.BlendMode ); + CPPUNIT_ASSERT_DOUBLES_EQUAL_MESSAGE( "Flatness is 0", + 1, rContext.Flatness, 0.00000001 ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Font id is 0", + sal_Int32(0), rContext.FontId ); + + static constexpr OUStringLiteral sExportString + = u"m12050 49610c-4310 0-7800-3490-7800-7800 0-4300 " + "3490-7790 7800-7790 4300 0 7790 3490 7790 7790 0 4310-3490 7800-7790 7800z"; + CPPUNIT_ASSERT_EQUAL_MESSAGE( "Stroke is a 4-bezier circle", + OUString(sExportString), basegfx::utils::exportToSvgD( aPath, true, true, false ) ); + + m_bRedCircleSeen = true; + } + + virtual void intersectClip(const uno::Reference& rPath) override + { + basegfx::B2DPolyPolygon aNewClip = basegfx::unotools::b2DPolyPolygonFromXPolyPolygon2D(rPath); + basegfx::B2DPolyPolygon aCurClip = getCurrentContext().Clip; + + if( aCurClip.count() ) // #i92985# adapted API from (..., false, false) to (..., true, false) + aNewClip = basegfx::utils::clipPolyPolygonOnPolyPolygon( aCurClip, aNewClip, true, false ); + + getCurrentContext().Clip = aNewClip; + } + + virtual void intersectEoClip(const uno::Reference& rPath) override + { + basegfx::B2DPolyPolygon aNewClip = basegfx::unotools::b2DPolyPolygonFromXPolyPolygon2D(rPath); + basegfx::B2DPolyPolygon aCurClip = getCurrentContext().Clip; + + if( aCurClip.count() ) // #i92985# adapted API from (..., false, false) to (..., true, false) + aNewClip = basegfx::utils::clipPolyPolygonOnPolyPolygon( aCurClip, aNewClip, true, false ); + + getCurrentContext().Clip = aNewClip; + } + + virtual void drawGlyphs( const OUString& rGlyphs, + const geometry::RealRectangle2D& /*rRect*/, + const geometry::Matrix2D& /*rFontMatrix*/, + double /*fontSize*/) override + { + m_aTextOut.append(rGlyphs); + } + + virtual void endText() override + { + m_aTextOut.append( "\n" ); + } + + virtual void drawMask(const uno::Sequence& xBitmap, + bool /*bInvert*/ ) override + { + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawMask received two properties", + sal_Int32(3), xBitmap.getLength() ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawMask got URL param", + OUString("URL"), xBitmap[0].Name ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawMask got InputStream param", + OUString("InputStream"), xBitmap[1].Name ); + } + + virtual void drawImage(const uno::Sequence& xBitmap ) override + { + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawImage received two properties", + sal_Int32(3), xBitmap.getLength() ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawImage got URL param", + OUString("URL"), xBitmap[0].Name ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawImage got InputStream param", + OUString("InputStream"), xBitmap[1].Name ); + m_bImageSeen = true; + } + + virtual void drawColorMaskedImage(const uno::Sequence& xBitmap, + const uno::Sequence& /*xMaskColors*/ ) override + { + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawColorMaskedImage received two properties", + sal_Int32(3), xBitmap.getLength() ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawColorMaskedImage got URL param", + OUString("URL"), xBitmap[0].Name ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawColorMaskedImage got InputStream param", + OUString("InputStream"), xBitmap[1].Name ); + } + + virtual void drawMaskedImage(const uno::Sequence& xBitmap, + const uno::Sequence& xMask, + bool /*bInvertMask*/) override + { + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawMaskedImage received two properties #1", + sal_Int32(3), xBitmap.getLength() ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawMaskedImage got URL param #1", + OUString("URL"), xBitmap[0].Name ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawMaskedImage got InputStream param #1", + OUString("InputStream"), xBitmap[1].Name ); + + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawMaskedImage received two properties #2", + sal_Int32(3), xMask.getLength() ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawMaskedImage got URL param #2", + OUString("URL"), xMask[0].Name ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawMaskedImage got InputStream param #2", + OUString("InputStream"), xMask[1].Name ); + } + + virtual void drawAlphaMaskedImage(const uno::Sequence& xBitmap, + const uno::Sequence& xMask) override + { + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawAlphaMaskedImage received two properties #1", + sal_Int32(3), xBitmap.getLength() ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawAlphaMaskedImage got URL param #1", + OUString("URL"), xBitmap[0].Name ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawAlphaMaskedImage got InputStream param #1", + OUString("InputStream"), xBitmap[1].Name ); + + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawAlphaMaskedImage received two properties #2", + sal_Int32(3), xMask.getLength() ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawAlphaMaskedImage got URL param #2", + OUString("URL"), xMask[0].Name ); + CPPUNIT_ASSERT_EQUAL_MESSAGE( "drawAlphaMaskedImage got InputStream param #2", + OUString("InputStream"), xMask[1].Name ); + } + + virtual void setTextRenderMode( sal_Int32 ) override + { + } + + typedef std::unordered_map IdToFontMap; + typedef std::unordered_map FontToIdMap; + + typedef std::vector GraphicsContextStack; + + sal_Int32 m_nNextFontId; + IdToFontMap m_aIdToFont; + FontToIdMap m_aFontToId; + + GraphicsContextStack m_aGCStack; + geometry::RealSize2D m_aPageSize; + geometry::RealRectangle2D m_aHyperlinkBounds; + OUString m_aURI; + OUStringBuffer m_aTextOut; + sal_Int32 m_nNumPages; + bool m_bPageEnded; + bool m_bRedCircleSeen; + bool m_bGreenStrokeSeen; + bool m_bDashedLineSeen; + bool m_bImageSeen; + }; + + class PDFITest : public test::BootstrapFixture, public XmlTestTools + { + protected: + virtual void registerNamespaces(xmlXPathContextPtr& pXmlXPathCtx) override + { + XmlTestTools::registerODFNamespaces(pXmlXPathCtx); + }; + public: + void testXPDFParser() + { +#if HAVE_FEATURE_POPPLER + auto pSink = std::make_shared(); + CPPUNIT_ASSERT( + pdfi::xpdf_ImportFromFile( + m_directories.getURLFromSrc(u"/sdext/source/pdfimport/test/testinput.pdf"), + pSink, + uno::Reference< task::XInteractionHandler >(), + OUString(), + getComponentContext(), "" ) ); + pSink->check(); +#endif + } + + void testOdfDrawExport() + { +#if HAVE_FEATURE_POPPLER + rtl::Reference xAdaptor( new pdfi::PDFIRawAdaptor(OUString(), getComponentContext()) ); + xAdaptor->setTreeVisitorFactory( createDrawTreeVisitorFactory() ); + + OUString tempFileURL; + CPPUNIT_ASSERT_EQUAL( osl::File::E_None, osl::File::createTempFile( nullptr, nullptr, &tempFileURL ) ); + osl::File::remove( tempFileURL ); // FIXME the below apparently fails silently if the file already exists + CPPUNIT_ASSERT_MESSAGE("Exporting to ODF", + xAdaptor->odfConvert( m_directories.getURLFromSrc(u"/sdext/source/pdfimport/test/testinput.pdf"), + new OutputWrap(tempFileURL), + nullptr )); + osl::File::remove( tempFileURL ); +#endif + } + + void testOdfWriterExport() + { +#if HAVE_FEATURE_POPPLER + rtl::Reference xAdaptor( new pdfi::PDFIRawAdaptor(OUString(), getComponentContext()) ); + xAdaptor->setTreeVisitorFactory( createWriterTreeVisitorFactory() ); + + OUString tempFileURL; + CPPUNIT_ASSERT_EQUAL( osl::File::E_None, osl::File::createTempFile( nullptr, nullptr, &tempFileURL ) ); + osl::File::remove( tempFileURL ); // FIXME the below apparently fails silently if the file already exists + CPPUNIT_ASSERT_MESSAGE("Exporting to ODF", + xAdaptor->odfConvert( m_directories.getURLFromSrc(u"/sdext/source/pdfimport/test/testinput.pdf"), + new OutputWrap(tempFileURL), + nullptr )); + osl::File::remove( tempFileURL ); +#endif + } + + void testTdf96993() + { +#if HAVE_FEATURE_POPPLER + rtl::Reference xAdaptor(new pdfi::PDFIRawAdaptor(OUString(), getComponentContext())); + xAdaptor->setTreeVisitorFactory(createDrawTreeVisitorFactory()); + + OString aOutput; + CPPUNIT_ASSERT_MESSAGE("Exporting to ODF", + xAdaptor->odfConvert(m_directories.getURLFromSrc(u"/sdext/source/pdfimport/test/testTdf96993.pdf"), + new OutputWrapString(aOutput), + nullptr)); + // This ensures that the imported image arrives properly flipped + CPPUNIT_ASSERT(aOutput.indexOf("draw:transform=\"matrix(18520.8333333333 0 0 26281.9444444444 0 0)\"") != -1); +#endif + } + + void testTdf98421() + { +#if HAVE_FEATURE_POPPLER + rtl::Reference xAdaptor(new pdfi::PDFIRawAdaptor(OUString(), getComponentContext())); + xAdaptor->setTreeVisitorFactory(createWriterTreeVisitorFactory()); + + OString aOutput; + CPPUNIT_ASSERT_MESSAGE("Exporting to ODF", + xAdaptor->odfConvert(m_directories.getURLFromSrc(u"/sdext/source/pdfimport/test/testTdf96993.pdf"), + new OutputWrapString(aOutput), + nullptr)); + // This ensures that the imported image arrives properly flipped + CPPUNIT_ASSERT(aOutput.indexOf("draw:transform=\"scale( 1.0 -1.0 ) translate( 0mm 0mm )\"") != -1); + CPPUNIT_ASSERT(aOutput.indexOf("svg:height=\"-262.82mm\"") != -1); +#endif + } + + void testTdf105536() + { +#if HAVE_FEATURE_POPPLER + rtl::Reference xAdaptor(new pdfi::PDFIRawAdaptor(OUString(), getComponentContext())); + xAdaptor->setTreeVisitorFactory(createDrawTreeVisitorFactory()); + + OString aOutput; + CPPUNIT_ASSERT_MESSAGE("Exporting to ODF", + xAdaptor->odfConvert(m_directories.getURLFromSrc(u"/sdext/source/pdfimport/test/testTdf105536.pdf"), + new OutputWrapString(aOutput), + nullptr)); + // This ensures that the imported image arrives properly flipped + CPPUNIT_ASSERT(aOutput.indexOf("draw:transform=\"matrix(-21488.4 0 0 -27978.1 21488.4 27978.1)\"") != -1); +#endif + } + + void testTdf141709() + { +// this test crashes on the windows jenkins boxes, but no-one can catch it locally +#if HAVE_FEATURE_POPPLER && !defined(_WIN32) + rtl::Reference xAdaptor(new pdfi::PDFIRawAdaptor(OUString(), getComponentContext())); + xAdaptor->setTreeVisitorFactory(createDrawTreeVisitorFactory()); + + OString aOutput; + CPPUNIT_ASSERT_MESSAGE("Exporting to ODF", + xAdaptor->odfConvert(m_directories.getURLFromSrc(u"/sdext/source/pdfimport/test/testTdf141709.pdf"), + new OutputWrapString(aOutput), + nullptr)); + std::cout << aOutput << std::endl; + // This ensures that the imported text contains all of the characters + CPPUNIT_ASSERT(aOutput.indexOf("敏") != -1); + CPPUNIT_ASSERT(aOutput.indexOf("捷") != -1); + CPPUNIT_ASSERT(aOutput.indexOf("的") != -1); + CPPUNIT_ASSERT(aOutput.indexOf("狐") != -1); + CPPUNIT_ASSERT(aOutput.indexOf("狸") != -1); + CPPUNIT_ASSERT(aOutput.indexOf("跨") != -1); + CPPUNIT_ASSERT(aOutput.indexOf("过") != -1); + CPPUNIT_ASSERT(aOutput.indexOf("慵") != -1); + CPPUNIT_ASSERT(aOutput.indexOf("懒") != -1); + CPPUNIT_ASSERT(aOutput.indexOf("的") != -1); + CPPUNIT_ASSERT(aOutput.indexOf("狗") != -1); + CPPUNIT_ASSERT(aOutput.indexOf("。") != -1); +#endif + } + + void testTdf78427_FontFeatures() + { + rtl::Reference xAdaptor(new pdfi::PDFIRawAdaptor(OUString(), getComponentContext())); + xAdaptor->setTreeVisitorFactory(createDrawTreeVisitorFactory()); + + OString aOutput; + CPPUNIT_ASSERT_MESSAGE("Converting PDF to ODF XML", + xAdaptor->odfConvert( m_directories.getURLFromSrc( + u"/sdext/source/pdfimport/test/testdocs/tdf78427-testFontFeatures.pdf"), + new OutputWrapString(aOutput), + nullptr )); + // Un-comment the following debug line to see the content of generated XML content in + // workdir/CppunitTest/sdext_pdfimport.test.log after running "make CppunitTest_sdext_pdfimport". + //std::cout << aOutput << std::endl; + xmlDocUniquePtr pXmlDoc(xmlParseDoc(reinterpret_cast(aOutput.getStr()))); + //CPPUNIT_ASSERT(pXmlDoc); + + /* Test for the 1st paragraph */ + OUString styleName = getXPath(pXmlDoc, "//draw:frame[1]//text:span[1]", "style-name"); + OString xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // the font-weight and font-style should be normal + assertXPath(pXmlDoc, xpath, "font-weight", "normal"); + assertXPathNoAttribute(pXmlDoc, xpath, "font-style"); + + /* Test for the 2nd paragraph */ + styleName = getXPath(pXmlDoc, "//draw:frame[2]//text:span[1]", "style-name"); + xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // there should be a font-weight="bold", but no font-style italic + assertXPath(pXmlDoc, xpath, "font-weight", "bold"); + assertXPathNoAttribute(pXmlDoc, xpath, "font-style"); + + /* Test for the 3rd paragraph */ + styleName = getXPath(pXmlDoc, "//draw:frame[3]//text:span[1]", "style-name"); + xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // there should be a font-style="italic", but no font-weight bold + assertXPath(pXmlDoc, xpath, "font-weight", "normal"); + assertXPath(pXmlDoc, xpath, "font-style", "italic"); + + /* Test for the 4th paragraph */ + styleName = getXPath(pXmlDoc, "//draw:frame[4]//text:span[1]", "style-name"); + xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // there should be both font-style="italic" and font-weight="bold" + assertXPath(pXmlDoc, xpath, "font-weight", "bold"); + assertXPath(pXmlDoc, xpath, "font-style", "italic"); + + /* Test for the 5th paragraph */ + styleName = getXPath(pXmlDoc, "//draw:frame[5]//text:span[1]", "style-name"); + xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // the font should be Arial and font-weight="bold", no font-style + assertXPath(pXmlDoc, xpath, "font-family", "Arial"); + assertXPath(pXmlDoc, xpath, "font-weight", "bold"); + assertXPathNoAttribute(pXmlDoc, xpath, "font-style"); + + /* Test for the 6th paragraph */ + styleName = getXPath(pXmlDoc, "//draw:frame[6]//text:span[1]", "style-name"); + xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // the font should be Arial without font-weight and font-style + assertXPath(pXmlDoc, xpath, "font-family", "Arial"); + assertXPath(pXmlDoc, xpath, "font-weight", "normal"); + assertXPathNoAttribute(pXmlDoc, xpath, "font-style"); + + /* Test for the 7th paragraph */ + styleName = getXPath(pXmlDoc, "//draw:frame[7]//text:span[1]", "style-name"); + xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // the font should be SimSun without font-weight and font-style + assertXPath(pXmlDoc, xpath, "font-family", "SimSun"); // TODO: tdf#143095 use localized font name rather than PS name + assertXPath(pXmlDoc, xpath, "font-weight", "normal"); + assertXPathNoAttribute(pXmlDoc, xpath, "font-style"); + + /* Test for the 8th paragraph */ + styleName = getXPath(pXmlDoc, "//draw:frame[8]//text:span[1]", "style-name"); + xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // the font should be SimSun and font-weight="bold", no font-style italic + assertXPath(pXmlDoc, xpath, "font-family", "SimSun"); + assertXPath(pXmlDoc, xpath, "font-weight", "bold"); + assertXPathNoAttribute(pXmlDoc, xpath, "font-style"); + + /* Test for the 9th paragraph */ + styleName = getXPath(pXmlDoc, "//draw:frame[9]//text:span[1]", "style-name"); + xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // the font should be SimSun, font-weight should be "normal", font-style="italic" + assertXPath(pXmlDoc, xpath, "font-family", "SimSun"); + assertXPath(pXmlDoc, xpath, "font-weight", "normal"); + // FIXME and remove the below comment: + // the chinese chars are shown in pdf as faux italic (fake italic). It is currencly imported wrongly as normal font style. + // See tdf#78427 for how the faux bold problem was handled. Faux italic may be handled using the transformation pattern. + // assertXPath(pXmlDoc, xpath, "font-style", "italic"); + + /* Test for the 10th paragraph */ + styleName = getXPath(pXmlDoc, "//draw:frame[10]//text:span[1]", "style-name"); + xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // the font should be SimSun font-weight="bold" and font-style="italic" + assertXPath(pXmlDoc, xpath, "font-family", "SimSun"); + assertXPath(pXmlDoc, xpath, "font-weight", "bold"); + // FIXME: faux italic, see above + // assertXPath(pXmlDoc, xpath, "font-style", "italic"); + + /* Test for the 11th paragraph */ + styleName = getXPath(pXmlDoc, "//draw:frame[11]//text:span[1]", "style-name"); + xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // the font should be SimSun and there should be style:text-outline="true" + // (i.e., the real "outline" font rather than faux bold / fake bold) + assertXPath(pXmlDoc, xpath, "font-family", "SimSun"); + assertXPath(pXmlDoc, xpath, "font-weight", "normal"); + assertXPathNoAttribute(pXmlDoc, xpath, "font-style"); + assertXPath(pXmlDoc, xpath, "text-outline", "true"); + } + + void testTdf78427_FontWeight_MyraidProSemibold() // Related to attachment 155937. + { + rtl::Reference xAdaptor(new pdfi::PDFIRawAdaptor(OUString(), getComponentContext())); + xAdaptor->setTreeVisitorFactory(createDrawTreeVisitorFactory()); + + OString aOutput; + CPPUNIT_ASSERT_MESSAGE("Converting PDF to ODF XML", + xAdaptor->odfConvert( m_directories.getURLFromSrc( + u"/sdext/source/pdfimport/test/testdocs/tdf78427-MyraidPro-Semibold-Light.pdf"), + new OutputWrapString(aOutput), + nullptr )); + //std::cout << aOutput << std::endl; + + xmlDocUniquePtr pXmlDoc(xmlParseDoc(reinterpret_cast(aOutput.getStr()))); + //CPPUNIT_ASSERT(pXmlDoc); + + // The for the 1st frame */ + OUString styleName = getXPath(pXmlDoc, "//draw:frame[1]//text:span[1]", "style-name"); + OString xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // the font-weight and font-style should be 600 (Semibold) + assertXPath(pXmlDoc, xpath, "font-weight", "600"); + + // The for the 2nd frame */ + styleName = getXPath(pXmlDoc, "//draw:frame[2]//text:span[1]", "style-name"); + xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + // the font-weight and font-style should be 300 (Light) + assertXPath(pXmlDoc, xpath, "font-weight", "300"); + } + + void testTdf143959_nameFromFontFile() + { + rtl::Reference xAdaptor(new pdfi::PDFIRawAdaptor(OUString(), getComponentContext())); + xAdaptor->setTreeVisitorFactory(createDrawTreeVisitorFactory()); + + OString aOutput; + CPPUNIT_ASSERT_MESSAGE("Converting PDF to ODF XML", + xAdaptor->odfConvert( m_directories.getURLFromSrc(u"/sdext/source/pdfimport/test/testdocs/testTdf143959.pdf"), + new OutputWrapString(aOutput), + nullptr )); + + //std::cout << aOutput << std::endl; + xmlDocUniquePtr pXmlDoc(xmlParseDoc(reinterpret_cast(aOutput.getStr()))); + + /* Test for the 1st text paragraph */ + OUString styleName = getXPath(pXmlDoc, "//draw:frame[2]//text:span[1]", "style-name"); + OString xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + CPPUNIT_ASSERT_EQUAL(OUString("TimesNewRoman"), + getXPath(pXmlDoc, xpath, "font-family").replaceAll(u" ", u"")); + + /* Test for the "TOTAL ESTA HOJA USD" paragraph" */ + styleName = getXPath(pXmlDoc, "//draw:frame[last()-1]//text:span[1]", "style-name"); + xpath = "//office:automatic-styles/style:style[@style:name=\"" + + OUStringToOString(styleName, RTL_TEXTENCODING_UTF8) + + "\"]/style:text-properties"; + CPPUNIT_ASSERT_EQUAL(OUString("TimesNewRoman"), + getXPath(pXmlDoc, xpath, "font-family").replaceAll(u" ", u"")); + CPPUNIT_ASSERT_EQUAL(OUString("bold"), + getXPath(pXmlDoc, xpath, "font-weight")); + } + + void testTdf104597_textrun() + { +#if HAVE_FEATURE_POPPLER + rtl::Reference xAdaptor(new pdfi::PDFIRawAdaptor(OUString(), getComponentContext())); + xAdaptor->setTreeVisitorFactory(createDrawTreeVisitorFactory()); + + OString aOutput; + CPPUNIT_ASSERT_MESSAGE("Converting PDF to ODF XML", + xAdaptor->odfConvert(m_directories.getURLFromSrc(u"/sdext/source/pdfimport/test/testdocs/tdf104597_textrun.pdf"), + new OutputWrapString(aOutput), + nullptr)); + + xmlDocUniquePtr pXmlDoc(xmlParseDoc(reinterpret_cast(aOutput.getStr()))); + + // Test for امُ عَلَيْكَ + OString xpath = "string(//draw:frame[@draw:transform='matrix(917.222222222222 0 0 917.222222222222 14821.9583333333 2159.23861112778)']/draw:text-box/text:p/text:span)"; + OUString sContent = getXPathContent(pXmlDoc, xpath); + CPPUNIT_ASSERT_EQUAL_MESSAGE(aOutput.getStr(), OUString(u"امُ عَلَيَْك"), sContent.replaceAll("\n\n", " ").replaceAll("\n", "")); + + // Test for ٱلسََّل . It appears in the 3rd frame, i.e. after the امُ عَلَيَْك which is in the 2nd frame (from left to right) + // thus these two frames together appear as ٱلسََّل امُ عَلَيْكَ in Draw‬. + // FIXME: Should be ٱلسَّلَامُ عَلَيْكَ (i.e. the two text frames should be merged into one so that the ل and the ا will show as لَا rather than ل ا) + xpath = "string(//draw:frame[@draw:transform='matrix(917.222222222222 0 0 917.222222222222 17420.1666666667 2159.23861112778)']/draw:text-box/text:p/text:span)"; + sContent = getXPathContent(pXmlDoc, xpath); + CPPUNIT_ASSERT_EQUAL_MESSAGE(aOutput.getStr(), OUString(u"ٱلسََّل"), sContent.replaceAll("\n\n", " ").replaceAll("\n", "")); + + // Test for "LibreOffice RTL" + xpath = "string(//draw:frame[@draw:transform='matrix(917.222222222222 0 0 917.222222222222 12779.375 5121.79583335)']/draw:text-box/text:p/text:span)"; + sContent = getXPathContent(pXmlDoc, xpath); + CPPUNIT_ASSERT_EQUAL_MESSAGE(aOutput.getStr(), OUString(u"LibreOffice RTL"), sContent.replaceAll("\n\n", " ").replaceAll("\n", "")); + + // Test for "LibreOffice LTR (test)" + xpath = "string(//draw:frame[last()-1]/draw:text-box/text:p/text:span[last()])"; + sContent = getXPathContent(pXmlDoc, xpath); + CPPUNIT_ASSERT_EQUAL_MESSAGE(aOutput.getStr(), OUString(u"LibreOffice LTR (test)"), sContent.replaceAll("\n\n", " ").replaceAll("\n", "")); + + /* Test for Chinese characters */ + // Use last() instead of matrix below, because the matrix may be different on different OS due to fallback of Chinese fonts. + xpath = "string(//draw:frame[last()]/draw:text-box/text:p/text:span)"; + sContent = getXPathContent(pXmlDoc, xpath); + CPPUNIT_ASSERT_EQUAL_MESSAGE(aOutput.getStr(), OUString(u"中文测试,中文"), sContent.replaceAll("\n\n", " ").replaceAll("\n", "")); + + // Test pdf text run in the Writer PDF import filter + xAdaptor->setTreeVisitorFactory(createWriterTreeVisitorFactory()); + OString aOutput2; + xAdaptor->odfConvert(m_directories.getURLFromSrc(u"/sdext/source/pdfimport/test/testdocs/tdf104597_textrun.pdf"), + new OutputWrapString(aOutput2), + nullptr); + xmlDocUniquePtr pXmlDoc2(xmlParseDoc(reinterpret_cast(aOutput2.getStr()))); + xpath = "string(//draw:frame[@draw:z-index='3'][1]/draw:text-box/text:p/text:span)"; + sContent = getXPathContent(pXmlDoc2, xpath).replaceAll("\n\n", " ").replaceAll("\n", ""); + CPPUNIT_ASSERT_EQUAL_MESSAGE(aOutput2.getStr(), OUString(u"ٱلَّسَل"), sContent); + xpath = "string(//draw:frame[@draw:z-index='2'][1]/draw:text-box/text:p/text:span)"; + sContent = getXPathContent(pXmlDoc2, xpath).replaceAll("\n\n", " ").replaceAll("\n", ""); + CPPUNIT_ASSERT_EQUAL(true, sContent.match(u"اُم َعَلْيَك")); + xpath = "string(//draw:frame[last()]/draw:text-box/text:p/text:span)"; + sContent = getXPathContent(pXmlDoc2, xpath).replaceAll("\n\n", " ").replaceAll("\n", ""); + CPPUNIT_ASSERT_EQUAL_MESSAGE(aOutput2.getStr(), OUString(u"中文测试,中文"), sContent); +#endif + } + + void testSpaces() + { +#if HAVE_FEATURE_POPPLER + rtl::Reference xAdaptor(new pdfi::PDFIRawAdaptor(OUString(), getComponentContext())); + xAdaptor->setTreeVisitorFactory(createWriterTreeVisitorFactory()); + + OString aOutput; + xAdaptor->odfConvert(m_directories.getURLFromSrc(u"/sdext/source/pdfimport/test/testdocs/testSpace.pdf"), + new OutputWrapString(aOutput), + nullptr); + xmlDocUniquePtr pXmlDoc(xmlParseDoc(reinterpret_cast(aOutput.getStr()))); + + // Space test: there are 10 spaces, each space is expressed as a , + // thus the 10th text:s should exist and the attribute "text:c" should be "1". + OString xpath = "//draw:frame[@draw:z-index='1'][1]/draw:text-box/text:p/text:span/text:s[10]"; + OUString sContent = getXPath(pXmlDoc, xpath, "c"); + CPPUNIT_ASSERT_EQUAL_MESSAGE(aOutput.getStr(), OUString("1"), sContent); + + // Tab test: there are 10 tabs. Text before and after the tabs are shown in different draw frames. + // With the Liberation Serif font, the horizontal position of the first frame is 20.03mm and the + // second frame is 94.12mm. + xpath = "//draw:frame[@draw:z-index='2'][1]"; + sContent = getXPath(pXmlDoc, xpath, "transform"); + CPPUNIT_ASSERT_EQUAL_MESSAGE(aOutput.getStr(), OUString("translate( 20.03mm 25.05mm )"), sContent); + xpath = "//draw:frame[@draw:z-index='3'][1]"; + sContent = getXPath(pXmlDoc, xpath, "transform"); + CPPUNIT_ASSERT_EQUAL_MESSAGE(aOutput.getStr(), OUString("translate( 94.12mm 25.05mm )"), sContent); + + // Non-breaking space test: there are 10 NBSpaces, which are treated as the same as normal space in PDF, + // thus each is expressed as a . + // The 10th text:s should exist and the attribute "text:c" should be "1". + xpath = "//draw:frame[@draw:z-index='4'][1]/draw:text-box/text:p/text:span/text:s[10]"; + sContent = getXPath(pXmlDoc, xpath, "c"); + CPPUNIT_ASSERT_EQUAL_MESSAGE(aOutput.getStr(), OUString("1"), sContent); +#endif + } + + CPPUNIT_TEST_SUITE(PDFITest); + CPPUNIT_TEST(testXPDFParser); + CPPUNIT_TEST(testOdfWriterExport); + CPPUNIT_TEST(testOdfDrawExport); + CPPUNIT_TEST(testTdf96993); + CPPUNIT_TEST(testTdf98421); + CPPUNIT_TEST(testTdf105536); + CPPUNIT_TEST(testTdf141709); + CPPUNIT_TEST(testTdf78427_FontFeatures); + CPPUNIT_TEST(testTdf78427_FontWeight_MyraidProSemibold); + CPPUNIT_TEST(testTdf143959_nameFromFontFile); + CPPUNIT_TEST(testTdf104597_textrun); + CPPUNIT_TEST(testSpaces); + CPPUNIT_TEST_SUITE_END(); + }; + +} + +CPPUNIT_TEST_SUITE_REGISTRATION(PDFITest); + +CPPUNIT_PLUGIN_IMPLEMENT(); + +/* vim:set shiftwidth=4 softtabstop=4 expandtab: */ -- cgit v1.2.3