1 /**************************************************************
2  *
3  * Licensed to the Apache Software Foundation (ASF) under one
4  * or more contributor license agreements.  See the NOTICE file
5  * distributed with this work for additional information
6  * regarding copyright ownership.  The ASF licenses this file
7  * to you under the Apache License, Version 2.0 (the
8  * "License"); you may not use this file except in compliance
9  * with the License.  You may obtain a copy of the License at
10  *
11  *   http://www.apache.org/licenses/LICENSE-2.0
12  *
13  * Unless required by applicable law or agreed to in writing,
14  * software distributed under the License is distributed on an
15  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
16  * KIND, either express or implied.  See the License for the
17  * specific language governing permissions and limitations
18  * under the License.
19  *
20  *************************************************************/
21 
22 
23 
24 // MARKER(update_precomp.py): autogen include statement, do not remove
25 #include "precompiled_sdext.hxx"
26 
27 #include "pdfiadaptor.hxx"
28 #include "filterdet.hxx"
29 #include "saxemitter.hxx"
30 #include "odfemitter.hxx"
31 #include "inc/wrapper.hxx"
32 #include "inc/contentsink.hxx"
33 #include "tree/pdfiprocessor.hxx"
34 
35 #include <osl/file.h>
36 #include <osl/thread.h>
37 #include <osl/diagnose.h>
38 #include <cppuhelper/factory.hxx>
39 #include <cppuhelper/implementationentry.hxx>
40 #include <com/sun/star/lang/XMultiComponentFactory.hpp>
41 #include <com/sun/star/uno/RuntimeException.hpp>
42 #include <com/sun/star/io/XInputStream.hpp>
43 #include <com/sun/star/frame/XLoadable.hpp>
44 #include <com/sun/star/xml/sax/XDocumentHandler.hpp>
45 #include <com/sun/star/io/XSeekable.hpp>
46 
47 
48 #include <boost/shared_ptr.hpp>
49 
50 using namespace com::sun::star;
51 
52 
53 namespace pdfi
54 {
55 
PDFIHybridAdaptor(const uno::Reference<uno::XComponentContext> & xContext)56 PDFIHybridAdaptor::PDFIHybridAdaptor( const uno::Reference< uno::XComponentContext >& xContext ) :
57 	PDFIHybridAdaptorBase( m_aMutex ),
58 	m_xContext( xContext ),
59 	m_xModel()
60 {
61 }
62 
63 // XFilter
filter(const uno::Sequence<beans::PropertyValue> & rFilterData)64 sal_Bool SAL_CALL PDFIHybridAdaptor::filter( const uno::Sequence< beans::PropertyValue >& rFilterData ) throw( uno::RuntimeException )
65 {
66     sal_Bool bRet = sal_False;
67     if( m_xModel.is() )
68     {
69         uno::Reference< io::XStream > xSubStream;
70         rtl::OUString aPwd;
71         const beans::PropertyValue* pAttribs = rFilterData.getConstArray();
72         sal_Int32 nAttribs = rFilterData.getLength();
73         sal_Int32 nPwPos = -1;
74         for( sal_Int32 i = 0; i < nAttribs; i++ )
75         {
76             #if OSL_DEBUG_LEVEL > 1
77             rtl::OUString aVal( RTL_CONSTASCII_USTRINGPARAM( "<no string>" ) );
78             pAttribs[i].Value >>= aVal;
79             OSL_TRACE( "filter: Attrib: %s = %s\n",
80                        rtl::OUStringToOString( pAttribs[i].Name, RTL_TEXTENCODING_UTF8 ).getStr(),
81                        rtl::OUStringToOString( aVal, RTL_TEXTENCODING_UTF8 ).getStr() );
82             #endif
83             if( pAttribs[i].Name.equalsAscii( "EmbeddedSubstream" ) )
84                 pAttribs[i].Value >>= xSubStream;
85             else if( pAttribs[i].Name.equalsAscii( "Password" ) )
86             {
87                 nPwPos = i;
88                 pAttribs[i].Value >>= aPwd;
89             }
90         }
91         bool bAddPwdProp = false;
92         if( ! xSubStream.is() )
93         {
94             uno::Reference< io::XInputStream > xInput;
95             for( sal_Int32 i = 0; i < nAttribs; i++ )
96             {
97                 if( pAttribs[i].Name.equalsAscii( "InputStream" ) )
98                 {
99                     pAttribs[i].Value >>= xInput;
100                     break;
101                 }
102             }
103             if( xInput.is() )
104             {
105 				// TODO(P2): extracting hybrid substream twice - once during detection, second time here
106                 uno::Reference< io::XSeekable > xSeek( xInput, uno::UNO_QUERY );
107                 if( xSeek.is() )
108                     xSeek->seek( 0 );
109                 oslFileHandle aFile = NULL;
110                 sal_uInt64 nWritten = 0;
111                 rtl::OUString aURL;
112                 if( osl_createTempFile( NULL, &aFile, &aURL.pData ) == osl_File_E_None )
113                 {
114                     OSL_TRACE( "created temp file %s\n", rtl::OUStringToOString( aURL, RTL_TEXTENCODING_UTF8 ).getStr() );
115                     const sal_Int32 nBufSize = 4096;
116                     uno::Sequence<sal_Int8> aBuf(nBufSize);
117                     // copy the bytes
118                     sal_Int32 nBytes;
119                     do
120                     {
121                         nBytes = xInput->readBytes( aBuf, nBufSize );
122                         if( nBytes > 0 )
123                         {
124                             osl_writeFile( aFile, aBuf.getConstArray(), nBytes, &nWritten );
125                             if( static_cast<sal_Int32>(nWritten) != nBytes )
126                             {
127                                 xInput.clear();
128                                 break;
129                             }
130                         }
131                     } while( nBytes == nBufSize );
132                     osl_closeFile( aFile );
133                     if( xInput.is() )
134                     {
135                         rtl::OUString aEmbedMimetype;
136                         rtl::OUString aOrgPwd( aPwd );
137                         xSubStream = getAdditionalStream( aURL, aEmbedMimetype, aPwd, m_xContext, rFilterData, true );
138                         if( aOrgPwd != aPwd )
139                             bAddPwdProp = true;
140                     }
141                     osl_removeFile( aURL.pData );
142                 }
143                 else
144                     xSubStream.clear();
145             }
146         }
147         if( xSubStream.is() )
148         {
149             uno::Sequence< uno::Any > aArgs( 2 );
150             aArgs[0] <<= m_xModel;
151             aArgs[1] <<= xSubStream;
152 
153             OSL_TRACE( "try to instantiate subfilter\n" );
154             uno::Reference< document::XFilter > xSubFilter;
155             try {
156                 xSubFilter = uno::Reference<document::XFilter>(
157                     m_xContext->getServiceManager()->createInstanceWithArgumentsAndContext(
158                         rtl::OUString( RTL_CONSTASCII_USTRINGPARAM( "com.sun.star.document.OwnSubFilter" ) ),
159                         aArgs,
160                         m_xContext ),
161                     uno::UNO_QUERY );
162             }
163             catch(uno::Exception& e)
164             {
165                 (void)e;
166                 OSL_TRACE( "subfilter exception: %s\n",
167                            OUStringToOString( e.Message, RTL_TEXTENCODING_UTF8 ).getStr() );
168             }
169 
170             OSL_TRACE( "subfilter: %p\n", xSubFilter.get() );
171             if( xSubFilter.is() )
172             {
173                 if( bAddPwdProp )
174                 {
175                     uno::Sequence<beans::PropertyValue> aFilterData( rFilterData );
176                     if( nPwPos == -1 )
177                     {
178                         nPwPos = aFilterData.getLength();
179                         aFilterData.realloc( nPwPos+1 );
180                         aFilterData[nPwPos].Name = rtl::OUString(
181                             RTL_CONSTASCII_USTRINGPARAM( "Password" ) );
182                     }
183                     aFilterData[nPwPos].Value <<= aPwd;
184                     bRet = xSubFilter->filter( aFilterData );
185                 }
186                 else
187                     bRet = xSubFilter->filter( rFilterData );
188             }
189         }
190         #if OSL_DEBUG_LEVEL > 1
191         else
192             OSL_TRACE( "PDFIAdaptor::filter: no embedded substream set\n" );
193         #endif
194     }
195     #if OSL_DEBUG_LEVEL > 1
196     else
197         OSL_TRACE( "PDFIAdaptor::filter: no model set\n" );
198     #endif
199 
200     return bRet;
201 }
202 
cancel()203 void SAL_CALL PDFIHybridAdaptor::cancel() throw()
204 {
205 }
206 
207 //XImporter
setTargetDocument(const uno::Reference<lang::XComponent> & xDocument)208 void SAL_CALL PDFIHybridAdaptor::setTargetDocument( const uno::Reference< lang::XComponent >& xDocument ) throw( lang::IllegalArgumentException )
209 {
210     OSL_TRACE( "PDFIAdaptor::setTargetDocument\n" );
211     m_xModel = uno::Reference< frame::XModel >( xDocument, uno::UNO_QUERY );
212     if( xDocument.is() && ! m_xModel.is() )
213         throw lang::IllegalArgumentException();
214 }
215 
216 //---------------------------------------------------------------------------------------
217 
PDFIRawAdaptor(const uno::Reference<uno::XComponentContext> & xContext)218 PDFIRawAdaptor::PDFIRawAdaptor( const uno::Reference< uno::XComponentContext >& xContext ) :
219     PDFIAdaptorBase( m_aMutex ),
220     m_xContext( xContext ),
221     m_xModel(),
222     m_pVisitorFactory(),
223     m_bEnableToplevelText(false)
224 {
225 }
226 
setTreeVisitorFactory(const TreeVisitorFactorySharedPtr & rVisitorFactory)227 void PDFIRawAdaptor::setTreeVisitorFactory(const TreeVisitorFactorySharedPtr& rVisitorFactory)
228 {
229     m_pVisitorFactory = rVisitorFactory;
230 }
231 
parse(const uno::Reference<io::XInputStream> & xInput,const uno::Reference<task::XInteractionHandler> & xIHdl,const rtl::OUString & rPwd,const uno::Reference<task::XStatusIndicator> & xStatus,const XmlEmitterSharedPtr & rEmitter,const rtl::OUString & rURL)232 bool PDFIRawAdaptor::parse( const uno::Reference<io::XInputStream>&       xInput,
233                             const uno::Reference<task::XInteractionHandler>& xIHdl,
234                             const rtl::OUString&                          rPwd,
235                             const uno::Reference<task::XStatusIndicator>& xStatus,
236                             const XmlEmitterSharedPtr&                    rEmitter,
237                             const rtl::OUString&                          rURL )
238 {
239     // container for metaformat
240     boost::shared_ptr<PDFIProcessor> pSink(
241         new PDFIProcessor(xStatus, m_xContext));
242 
243     // TEMP! TEMP!
244     if( m_bEnableToplevelText )
245         pSink->enableToplevelText();
246 
247     bool bSuccess=false;
248 
249     if( xInput.is() && (!rURL.getLength() || rURL.compareToAscii( "file:", 5 ) != 0) )
250         bSuccess = xpdf_ImportFromStream( xInput, pSink, xIHdl, rPwd, m_xContext );
251     else
252         bSuccess = xpdf_ImportFromFile( rURL, pSink, xIHdl, rPwd, m_xContext );
253 
254     if( bSuccess )
255         pSink->emit(*rEmitter,*m_pVisitorFactory);
256 
257     return bSuccess;
258 }
259 
odfConvert(const rtl::OUString & rURL,const uno::Reference<io::XOutputStream> & xOutput,const uno::Reference<task::XStatusIndicator> & xStatus)260 bool PDFIRawAdaptor::odfConvert( const rtl::OUString&                          rURL,
261                                  const uno::Reference<io::XOutputStream>&      xOutput,
262                                  const uno::Reference<task::XStatusIndicator>& xStatus )
263 {
264     XmlEmitterSharedPtr pEmitter = createOdfEmitter(xOutput);
265     const bool bSuccess = parse(uno::Reference<io::XInputStream>(),
266                                 uno::Reference<task::XInteractionHandler>(),
267                                 rtl::OUString(),
268                                 xStatus,pEmitter,rURL);
269 
270     // tell input stream that it is no longer needed
271 	xOutput->closeOutput();
272 
273     return bSuccess;
274 }
275 
276 // XImportFilter
importer(const uno::Sequence<beans::PropertyValue> & rSourceData,const uno::Reference<xml::sax::XDocumentHandler> & rHdl,const uno::Sequence<rtl::OUString> &)277 sal_Bool SAL_CALL PDFIRawAdaptor::importer( const uno::Sequence< beans::PropertyValue >&        rSourceData,
278                                             const uno::Reference< xml::sax::XDocumentHandler >& rHdl,
279                                             const uno::Sequence< rtl::OUString >&               /*rUserData*/ ) throw( uno::RuntimeException )
280 {
281     // get the InputStream carrying the PDF content
282     uno::Reference< io::XInputStream > xInput;
283     uno::Reference< task::XStatusIndicator > xStatus;
284     uno::Reference< task::XInteractionHandler > xInteractionHandler;
285     rtl::OUString aURL;
286     rtl::OUString aPwd;
287     const beans::PropertyValue* pAttribs = rSourceData.getConstArray();
288     sal_Int32 nAttribs = rSourceData.getLength();
289     for( sal_Int32 i = 0; i < nAttribs; i++, pAttribs++ )
290     {
291         OSL_TRACE("importer Attrib: %s\n", OUStringToOString( pAttribs->Name, RTL_TEXTENCODING_UTF8 ).getStr() );
292         if( pAttribs->Name.equalsAscii( "InputStream" ) )
293             pAttribs->Value >>= xInput;
294         else if( pAttribs->Name.equalsAscii( "URL" ) )
295             pAttribs->Value >>= aURL;
296         else if( pAttribs->Name.equalsAscii( "StatusIndicator" ) )
297             pAttribs->Value >>= xStatus;
298         else if( pAttribs->Name.equalsAscii( "InteractionHandler" ) )
299             pAttribs->Value >>= xInteractionHandler;
300         else if( pAttribs->Name.equalsAscii( "Password" ) )
301             pAttribs->Value >>= aPwd;
302     }
303     if( !xInput.is() )
304         return sal_False;
305 
306     XmlEmitterSharedPtr pEmitter = createSaxEmitter(rHdl);
307     const bool bSuccess = parse(xInput,xInteractionHandler, aPwd, xStatus,pEmitter,aURL);
308 
309     // tell input stream that it is no longer needed
310     xInput->closeInput();
311     xInput.clear();
312 
313     return bSuccess;
314 }
315 
316 //XImporter
setTargetDocument(const uno::Reference<lang::XComponent> & xDocument)317 void SAL_CALL PDFIRawAdaptor::setTargetDocument( const uno::Reference< lang::XComponent >& xDocument ) throw( lang::IllegalArgumentException )
318 {
319     OSL_TRACE( "PDFIAdaptor::setTargetDocument\n" );
320     m_xModel = uno::Reference< frame::XModel >( xDocument, uno::UNO_QUERY );
321     if( xDocument.is() && ! m_xModel.is() )
322         throw lang::IllegalArgumentException();
323 }
324 
325 }
326