1 /* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
3 * This file is part of the LibreOffice project.
5 * This Source Code Form is subject to the terms of the Mozilla Public
6 * License, v. 2.0. If a copy of the MPL was not distributed with this
7 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
9 * This file incorporates work covered by the following license notice:
11 * Licensed to the Apache Software Foundation (ASF) under one or more
12 * contributor license agreements. See the NOTICE file distributed
13 * with this work for additional information regarding copyright
14 * ownership. The ASF licenses this file to you under the Apache
15 * License, Version 2.0 (the "License"); you may not use this file
16 * except in compliance with the License. You may obtain a copy of
17 * the License at http://www.apache.org/licenses/LICENSE-2.0 .
20 #include "swdetect.hxx"
22 #include <cppuhelper/supportsservice.hxx>
23 #include <com/sun/star/io/XInputStream.hpp>
24 #include <com/sun/star/uno/XComponentContext.hpp>
25 #include <sfx2/docfile.hxx>
26 #include <sot/storage.hxx>
27 #include <tools/urlobj.hxx>
28 #include <unotools/mediadescriptor.hxx>
30 using namespace ::com::sun::star
;
31 using namespace ::com::sun::star::uno
;
32 using namespace ::com::sun::star::io
;
33 using namespace ::com::sun::star::task
;
34 using namespace ::com::sun::star::beans
;
35 using namespace ::com::sun::star::lang
;
36 using utl::MediaDescriptor
;
// Default constructor of SwFilterDetect.
// NOTE(review): no initializer list or body is visible in this view.
38 SwFilterDetect::SwFilterDetect()
// Destructor of SwFilterDetect.
// NOTE(review): no body is visible in this view.
42 SwFilterDetect::~SwFilterDetect()
// Checks whether the input stream carried in the media descriptor matches the
// type name carried in the same descriptor.
//
// lDescriptor: property sequence wrapped in a MediaDescriptor below.
//              PROP_TYPENAME and PROP_INPUTSTREAM are always read; PROP_URL is
//              read only for the "writer_MS_Word_97_Vorlage" check.
//
// The outcome of the checks is collected in bIsDetected.
// NOTE(review): no return statement is visible in this view. Presumably the
// function returns aTypeName when bIsDetected is true and an empty OUString
// otherwise (including the early bail-out checks) - confirm.
46 OUString SAL_CALL
SwFilterDetect::detect( Sequence
< PropertyValue
>& lDescriptor
)
48 MediaDescriptor
aMediaDesc( lDescriptor
);
// Type name to verify; defaults to an empty string if the property is absent.
49 OUString aTypeName
= aMediaDesc
.getUnpackedValueOrDefault( MediaDescriptor::PROP_TYPENAME
, OUString() );
50 uno::Reference
< io::XInputStream
> xInStream ( aMediaDesc
[MediaDescriptor::PROP_INPUTSTREAM
], uno::UNO_QUERY
);
// Without an input stream there is nothing to inspect.
// NOTE(review): the statement guarded by this check is not visible here.
51 if ( !xInStream
.is() )
// NOTE(review): the declaration of aMedium is not visible in this view;
// presumably an SfxMedium from <sfx2/docfile.hxx> - confirm.
// The medium reads from xInStream with its interaction handler switched off.
55 aMedium
.UseInteractionHandler( false );
56 aMedium
.setStreamToLoadFrom( xInStream
, true );
58 SvStream
*pInStrm
= aMedium
.GetInStream();
// Bail-out condition: no stream could be obtained, or it reports an error.
59 if ( !pInStrm
|| pInStrm
->GetError() )
62 bool bIsDetected
= false;
// RTF: the stream has to start with the five bytes "{\rtf".
64 if ( aTypeName
== "writer_Rich_Text_Format" )
66 pInStrm
->Seek( STREAM_SEEK_TO_BEGIN
);
67 bIsDetected
= ( read_uInt8s_ToOString( *pInStrm
, 5 ) == "{\\rtf" );
// "writer_MS_WinWord_5": compare the first three bytes of the stream against
// the signatures listed below.
69 else if ( aTypeName
== "writer_MS_WinWord_5" )
71 pInStrm
->Seek( STREAM_SEEK_TO_BEGIN
);
72 const sal_uInt8 nBufSize
= 3;
73 sal_uInt8 nBuffer
[ nBufSize
];
// Fewer than nBufSize bytes could be read.
// NOTE(review): the statement guarded by this check is not visible here.
74 if (pInStrm
->ReadBytes(nBuffer
, nBufSize
) < nBufSize
)
77 bIsDetected
= (nBuffer
[0] == 0x9B && nBuffer
[1] == 0xA5 && nBuffer
[2] == 0x21) // WinWord 1
78 || (nBuffer
[0] == 0x9C && nBuffer
[1] == 0xA5 && nBuffer
[2] == 0x21) // PMWord 1
79 || (nBuffer
[0] == 0xDB && nBuffer
[1] == 0xA5 && nBuffer
[2] == 0x2D) // WinWord 2
80 || (nBuffer
[0] == 0xDC && nBuffer
[1] == 0xA5 && nBuffer
[2] == 0x65); // WinWord 6.0/95, as a single stream file
// NOTE(review): the branch keyword introducing the following code is not
// visible in this view; presumably this is the fallback for all other type
// names - confirm.
84 // Do not attempt to create an SotStorage on a
85 // 0-length stream as that would create the compound
86 // document header on the stream and effectively write to it.
88 pInStrm
->Seek( STREAM_SEEK_TO_BEGIN
);
// Empty-stream check described in the comment above.
89 if ( pInStrm
->remainingSize() == 0 )
// Wrap the stream in an SotStorage so the streams it contains can be queried.
94 rtl::Reference
<SotStorage
> aStorage
= new SotStorage ( pInStrm
, false );
95 if ( !aStorage
->GetError() )
// The storage has to contain a "WordDocument" stream.
97 bIsDetected
= aStorage
->IsContained( u
"WordDocument"_ustr
);
// Type names starting with "writer_MS_Word_97" additionally require a
// "0Table" or a "1Table" stream.
98 if ( bIsDetected
&& aTypeName
.startsWith( "writer_MS_Word_97" ) )
100 bIsDetected
= ( aStorage
->IsContained(u
"0Table"_ustr
) || aStorage
->IsContained(u
"1Table"_ustr
) );
102 // If we are checking the template type, and the document is not a .dot, don't
// accept it as a template.
104 if ( bIsDetected
&& aTypeName
== "writer_MS_Word_97_Vorlage" )
106 // It is common practice to rename a .doc to .dot to make it a template.
107 // Since we have detected a .doc-ish format, always accept .dot-named-files
108 // as valid templates to avoid flagging this as an invalid .dot format.
109 INetURLObject
aParser(aMediaDesc
.getUnpackedValueOrDefault(
110 utl::MediaDescriptor::PROP_URL
, OUString()));
112 // Super ugly hack, but we don't want to use the whole WW8Fib thing here in
113 // the swd library, apparently. We know (do we?) that the "aBits1" byte, as
114 // the variable is called in WW8Fib::WW8Fib(SvStream&,sal_uInt8,sal_uInt32),
115 // is at offset 10 in the WordDocument stream. The fDot bit is bit 0x01 of
// that byte.
// The bit is only inspected when the URL extension (lower-cased) is not "dot".
117 if (aParser
.getExtension().toAsciiLowerCase() != "dot")
119 rtl::Reference
<SotStorageStream
> xWordDocument
120 = aStorage
->OpenSotStream(u
"WordDocument"_ustr
, StreamMode::STD_READ
);
// Seek to offset 10 and make sure the stream position really is 10 before
// reading the byte.
121 xWordDocument
->Seek(10);
122 if (xWordDocument
->Tell() == 10)
// NOTE(review): the declaration of aBits1 is not visible in this view.
125 xWordDocument
->ReadUChar(aBits1
);
// Accept as a template only if bit 0x01 (the fDot bit, see above) is set.
127 bIsDetected
= ((aBits1
& 0x01) == 0x01);
// Returns the implementation name of this component,
// "com.sun.star.comp.writer.FormatDetector".
147 OUString SAL_CALL
SwFilterDetect::getImplementationName()
149 return u
"com.sun.star.comp.writer.FormatDetector"_ustr
;
// Reports whether this object supports the service named sServiceName.
// The decision is delegated to cppu::supportsService, which receives this
// object and the requested name.
// NOTE(review): presumably that helper compares the name against
// getSupportedServiceNames() - confirm.
153 sal_Bool SAL_CALL
SwFilterDetect::supportsService( const OUString
& sServiceName
)
155 return cppu::supportsService(this, sServiceName
);
// Returns the service names of this implementation as a three-element
// sequence: ExtendedTypeDetection, FormatDetector and W4WFormatDetector.
159 Sequence
< OUString
> SAL_CALL
SwFilterDetect::getSupportedServiceNames()
161 return { u
"com.sun.star.frame.ExtendedTypeDetection"_ustr
, u
"com.sun.star.text.FormatDetector"_ustr
, u
"com.sun.star.text.W4WFormatDetector"_ustr
};
// Exported factory function with C linkage: creates a new SwFilterDetect and
// returns the result of passing it to cppu::acquire.
// Both parameters (component context and argument sequence) are unnamed and
// not used.
164 extern "C" SAL_DLLPUBLIC_EXPORT
css::uno::XInterface
*
165 com_sun_star_comp_writer_FormatDetector_get_implementation(css::uno::XComponentContext
*,
166 css::uno::Sequence
<css::uno::Any
> const &)
168 return cppu::acquire(new SwFilterDetect());
171 /* vim:set shiftwidth=4 softtabstop=4 expandtab: */