LibreOffice Module sax (master) 1
legacyfastparser.cxx
Go to the documentation of this file.
1/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
2/*
3 * This file is part of the LibreOffice project.
4 *
5 * This Source Code Form is subject to the terms of the Mozilla Public
6 * License, v. 2.0. If a copy of the MPL was not distributed with this
7 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
8 *
9 * This file incorporates work covered by the following license notice:
10 *
11 * Licensed to the Apache Software Foundation (ASF) under one or more
12 * contributor license agreements. See the NOTICE file distributed
13 * with this work for additional information regarding copyright
14 * ownership. The ASF licenses this file to you under the Apache
15 * License, Version 2.0 (the "License"); you may not use this file
16 * except in compliance with the License. You may obtain a copy of
17 * the License at http://www.apache.org/licenses/LICENSE-2.0 .
18 */
19
#include <com/sun/star/lang/XServiceInfo.hpp>
#include <com/sun/star/xml/sax/XParser.hpp>
#include <com/sun/star/xml/sax/FastParser.hpp>
#include <com/sun/star/lang/XInitialization.hpp>
#include <com/sun/star/beans/Pair.hpp>
#include <comphelper/attributelist.hxx>
#include <comphelper/processfactory.hxx>
#include <cppuhelper/implbase.hxx>
#include <cppuhelper/supportsservice.hxx>
#include <rtl/ref.hxx>
#include <memory>
#include <utility>
#include <vector>
32
33using namespace ::cppu;
34using namespace css;
35using namespace uno;
36using namespace lang;
37using namespace xml::sax;
38using namespace io;
39
40namespace {
41
42class NamespaceHandler : public WeakImplHelper< XFastNamespaceHandler >
43{
44private:
45 struct NamespaceDefine
46 {
47 OUString m_aPrefix;
48 OUString m_aNamespaceURI;
49
50 NamespaceDefine( OUString aPrefix, OUString aNamespaceURI ) : m_aPrefix(std::move( aPrefix )), m_aNamespaceURI(std::move( aNamespaceURI )) {}
51 };
52 std::vector< std::unique_ptr< NamespaceDefine > > m_aNamespaceDefines;
53
54public:
55 NamespaceHandler();
56 void addNSDeclAttributes( rtl::Reference < comphelper::AttributeList > const & rAttrList );
57
58 //XFastNamespaceHandler
59 virtual void SAL_CALL registerNamespace( const OUString& rNamespacePrefix, const OUString& rNamespaceURI ) override;
60 virtual OUString SAL_CALL getNamespaceURI( const OUString& rNamespacePrefix ) override;
61};
62
63NamespaceHandler::NamespaceHandler()
64{
65}
66
67void NamespaceHandler::addNSDeclAttributes( rtl::Reference < comphelper::AttributeList > const & rAttrList )
68{
69 for(const auto& aNamespaceDefine : m_aNamespaceDefines)
70 {
71 OUString& rPrefix = aNamespaceDefine->m_aPrefix;
72 OUString& rNamespaceURI = aNamespaceDefine->m_aNamespaceURI;
73 OUString sDecl;
74 if ( rPrefix.isEmpty() )
75 sDecl = "xmlns";
76 else
77 sDecl = "xmlns:" + rPrefix;
78 rAttrList->AddAttribute( sDecl, rNamespaceURI );
79 }
80 m_aNamespaceDefines.clear();
81}
82
83void NamespaceHandler::registerNamespace( const OUString& rNamespacePrefix, const OUString& rNamespaceURI )
84{
85 m_aNamespaceDefines.push_back( std::make_unique<NamespaceDefine>(
86 rNamespacePrefix, rNamespaceURI) );
87}
88
89OUString NamespaceHandler::getNamespaceURI( const OUString&/* rNamespacePrefix */ )
90{
91 return OUString();
92}
93
94class SaxLegacyFastParser : public WeakImplHelper< XInitialization, XServiceInfo, XParser >
95{
96private:
97 rtl::Reference< NamespaceHandler > m_aNamespaceHandler;
98public:
99 SaxLegacyFastParser();
100
101// css::lang::XInitialization:
102 virtual void SAL_CALL initialize(css::uno::Sequence<css::uno::Any> const& rArguments) override;
103
104// The SAX-Parser-Interface
105 virtual void SAL_CALL parseStream( const InputSource& structSource) override;
106 virtual void SAL_CALL setDocumentHandler(const Reference< XDocumentHandler > & xHandler) override;
107 virtual void SAL_CALL setErrorHandler(const Reference< XErrorHandler > & xHandler) override;
108 virtual void SAL_CALL setDTDHandler(const Reference < XDTDHandler > & xHandler) override;
109 virtual void SAL_CALL setEntityResolver(const Reference< XEntityResolver >& xResolver) override;
110 virtual void SAL_CALL setLocale( const Locale &locale ) override;
111
112// XServiceInfo
113 OUString SAL_CALL getImplementationName() override;
114 Sequence< OUString > SAL_CALL getSupportedServiceNames() override;
115 sal_Bool SAL_CALL supportsService(const OUString& ServiceName) override;
116
117private:
118 Reference< XFastParser > m_xParser;
119 Reference< XDocumentHandler > m_xDocumentHandler;
120 Reference< XFastTokenHandler > m_xTokenHandler;
121
122};
123
124
125class CallbackDocumentHandler : public WeakImplHelper< XFastDocumentHandler >
126{
127private:
128 Reference< XDocumentHandler > m_xDocumentHandler;
129 Reference< XFastTokenHandler > m_xTokenHandler;
130 rtl::Reference< NamespaceHandler > m_aNamespaceHandler;
131 OUString getNamespacePrefixFromToken( sal_Int32 nToken );
132 OUString getNameFromToken( sal_Int32 nToken );
133
134 static constexpr OUStringLiteral aDefaultNamespace = u"";
135 static constexpr OUStringLiteral aNamespaceSeparator = u":";
136
137public:
138 CallbackDocumentHandler( Reference< XDocumentHandler > const & xDocumentHandler,
139 rtl::Reference< NamespaceHandler > const & rNamespaceHandler,
140 Reference< XFastTokenHandler > const & xTokenHandler);
141
142 // XFastDocumentHandler
143 virtual void SAL_CALL startDocument() override;
144 virtual void SAL_CALL endDocument() override;
145 virtual void SAL_CALL processingInstruction( const OUString& rTarget, const OUString& rData ) override;
146 virtual void SAL_CALL setDocumentLocator( const Reference< XLocator >& xLocator ) override;
147
148 // XFastContextHandler
149 virtual void SAL_CALL startFastElement( sal_Int32 nElement, const Reference< XFastAttributeList >& Attribs ) override;
150 virtual void SAL_CALL startUnknownElement( const OUString& Namespace, const OUString& Name, const Reference< XFastAttributeList >& Attribs ) override;
151 virtual void SAL_CALL endFastElement( sal_Int32 Element ) override;
152 virtual void SAL_CALL endUnknownElement( const OUString& Namespace, const OUString& Name ) override;
153 virtual Reference< XFastContextHandler > SAL_CALL createFastChildContext( sal_Int32 nElement, const Reference< XFastAttributeList >& Attribs ) override;
154 virtual Reference< XFastContextHandler > SAL_CALL createUnknownChildContext( const OUString& Namespace, const OUString& Name, const Reference< XFastAttributeList >& Attribs ) override;
155 virtual void SAL_CALL characters( const OUString& aChars ) override;
156
157};
158
159OUString CallbackDocumentHandler::getNamespacePrefixFromToken( sal_Int32 nToken )
160{
161 if ( ( nToken & 0xffff0000 ) != 0 )
162 {
163 Sequence< sal_Int8 > aSeq = m_xTokenHandler->getUTF8Identifier( nToken & 0xffff0000 );
164 return OUString( reinterpret_cast< const char* >(
165 aSeq.getConstArray() ), aSeq.getLength(), RTL_TEXTENCODING_UTF8 );
166 }
167 else
168 return OUString();
169}
170
171OUString CallbackDocumentHandler::getNameFromToken( sal_Int32 nToken )
172{
173 Sequence< sal_Int8 > aSeq = m_xTokenHandler->getUTF8Identifier( nToken & 0xffff );
174 return OUString( reinterpret_cast< const char* >(
175 aSeq.getConstArray() ), aSeq.getLength(), RTL_TEXTENCODING_UTF8 );
176}
177
178CallbackDocumentHandler::CallbackDocumentHandler( Reference< XDocumentHandler > const & xDocumentHandler,
179 rtl::Reference< NamespaceHandler > const & rNamespaceHandler,
180 Reference< XFastTokenHandler > const & xTokenHandler)
181{
182 m_xDocumentHandler.set( xDocumentHandler );
183 m_aNamespaceHandler = rNamespaceHandler;
184 m_xTokenHandler.set( xTokenHandler );
185}
186
187void SAL_CALL CallbackDocumentHandler::startDocument()
188{
189 if ( m_xDocumentHandler.is() )
190 m_xDocumentHandler->startDocument();
191}
192
193void SAL_CALL CallbackDocumentHandler::endDocument()
194{
195 if ( m_xDocumentHandler.is() )
196 m_xDocumentHandler->endDocument();
197}
198
199void SAL_CALL CallbackDocumentHandler::processingInstruction( const OUString& rTarget, const OUString& rData )
200{
201 if ( m_xDocumentHandler.is() )
202 m_xDocumentHandler->processingInstruction( rTarget, rData );
203}
204
205void SAL_CALL CallbackDocumentHandler::setDocumentLocator( const Reference< XLocator >& xLocator )
206{
207 if ( m_xDocumentHandler.is() )
208 m_xDocumentHandler->setDocumentLocator( xLocator );
209}
210
211void SAL_CALL CallbackDocumentHandler::startFastElement( sal_Int32 nElement , const Reference< XFastAttributeList >& Attribs )
212{
213 const OUString& rPrefix = CallbackDocumentHandler::getNamespacePrefixFromToken( nElement );
214 const OUString& rLocalName = CallbackDocumentHandler::getNameFromToken( nElement );
215 startUnknownElement( aDefaultNamespace, (rPrefix.isEmpty())? rLocalName : rPrefix + aNamespaceSeparator + rLocalName, Attribs );
216}
217
218void SAL_CALL CallbackDocumentHandler::startUnknownElement( const OUString& /*Namespace*/, const OUString& Name, const Reference< XFastAttributeList >& Attribs )
219{
220 if ( !m_xDocumentHandler.is() )
221 return;
222
224 m_aNamespaceHandler->addNSDeclAttributes( rAttrList );
225
226 const Sequence< xml::FastAttribute > fastAttribs = Attribs->getFastAttributes();
227 for (const auto& rAttr : fastAttribs)
228 {
229 const OUString& rAttrValue = rAttr.Value;
230 sal_Int32 nToken = rAttr.Token;
231 const OUString& rAttrNamespacePrefix = CallbackDocumentHandler::getNamespacePrefixFromToken( nToken );
232 OUString sAttrName = CallbackDocumentHandler::getNameFromToken( nToken );
233 if ( !rAttrNamespacePrefix.isEmpty() )
234 sAttrName = rAttrNamespacePrefix + aNamespaceSeparator + sAttrName;
235
236 rAttrList->AddAttribute( sAttrName, rAttrValue );
237 }
238
239 const Sequence< xml::Attribute > unknownAttribs = Attribs->getUnknownAttributes();
240 for (const auto& rAttr : unknownAttribs)
241 {
242 const OUString& rAttrValue = rAttr.Value;
243 const OUString& rAttrName = rAttr.Name;
244
245 rAttrList->AddAttribute( rAttrName, rAttrValue );
246 }
247 m_xDocumentHandler->startElement( Name, rAttrList );
248}
249
250void SAL_CALL CallbackDocumentHandler::endFastElement( sal_Int32 nElement )
251{
252 const OUString& rPrefix = CallbackDocumentHandler::getNamespacePrefixFromToken( nElement );
253 const OUString& rLocalName = CallbackDocumentHandler::getNameFromToken( nElement );
254 endUnknownElement( aDefaultNamespace, (rPrefix.isEmpty())? rLocalName : rPrefix + aNamespaceSeparator + rLocalName );
255}
256
257
258void SAL_CALL CallbackDocumentHandler::endUnknownElement( const OUString& /*Namespace*/, const OUString& Name )
259{
260 if ( m_xDocumentHandler.is() )
261 {
262 m_xDocumentHandler->endElement( Name );
263 }
264}
265
266Reference< XFastContextHandler > SAL_CALL CallbackDocumentHandler::createFastChildContext( sal_Int32/* nElement */, const Reference< XFastAttributeList >&/* Attribs */ )
267{
268 return this;
269}
270
271
272Reference< XFastContextHandler > SAL_CALL CallbackDocumentHandler::createUnknownChildContext( const OUString&/* Namespace */, const OUString&/* Name */, const Reference< XFastAttributeList >&/* Attribs */ )
273{
274 return this;
275}
276
277void SAL_CALL CallbackDocumentHandler::characters( const OUString& aChars )
278{
279 if ( m_xDocumentHandler.is() )
280 m_xDocumentHandler->characters( aChars );
281}
282
283SaxLegacyFastParser::SaxLegacyFastParser( ) : m_aNamespaceHandler( new NamespaceHandler ),
285{
286 m_xParser->setNamespaceHandler( m_aNamespaceHandler );
287}
288
289void SAL_CALL SaxLegacyFastParser::initialize(Sequence< Any > const& rArguments )
290{
291 if (!rArguments.hasElements())
292 return;
293
294 Reference< XFastTokenHandler > xTokenHandler;
295 OUString str;
296 if ( ( rArguments[0] >>= xTokenHandler ) && xTokenHandler.is() )
297 {
298 m_xTokenHandler.set( xTokenHandler );
299 }
300 else if ( ( rArguments[0] >>= str ) && "registerNamespaces" == str )
301 {
302 css::beans::Pair< OUString, sal_Int32 > rPair;
303 for (sal_Int32 i = 1; i < rArguments.getLength(); i++ )
304 {
305 rArguments[i] >>= rPair;
306 m_xParser->registerNamespace( rPair.First, rPair.Second );
307 }
308 }
309 else
310 {
311 uno::Reference<lang::XInitialization> const xInit(m_xParser,
312 uno::UNO_QUERY_THROW);
313 xInit->initialize( rArguments );
314 }
315}
316
317void SaxLegacyFastParser::parseStream( const InputSource& structSource )
318{
319 m_xParser->setFastDocumentHandler( new CallbackDocumentHandler( m_xDocumentHandler,
320 m_aNamespaceHandler, m_xTokenHandler ) );
321 m_xParser->setTokenHandler( m_xTokenHandler );
322 m_xParser->parseStream( structSource );
323}
324
325void SaxLegacyFastParser::setDocumentHandler( const Reference< XDocumentHandler > & xHandler )
326{
327 m_xDocumentHandler = xHandler;
328}
329
330void SaxLegacyFastParser::setErrorHandler( const Reference< XErrorHandler > & xHandler )
331{
332 m_xParser->setErrorHandler( xHandler );
333}
334
335void SaxLegacyFastParser::setDTDHandler( const Reference < XDTDHandler > &/* xHandler */ )
336{
337
338}
339
340void SaxLegacyFastParser::setEntityResolver( const Reference< XEntityResolver >& xResolver )
341{
342 m_xParser->setEntityResolver( xResolver );
343}
344
345void SaxLegacyFastParser::setLocale( const Locale &locale )
346{
347 m_xParser->setLocale( locale );
348}
349
350OUString SaxLegacyFastParser::getImplementationName()
351{
352 return "com.sun.star.comp.extensions.xml.sax.LegacyFastParser";
353}
354
355sal_Bool SaxLegacyFastParser::supportsService(const OUString& ServiceName)
356{
357 return cppu::supportsService(this, ServiceName);
358}
359
360Sequence< OUString > SaxLegacyFastParser::getSupportedServiceNames()
361{
362 return { "com.sun.star.xml.sax.LegacyFastParser" };
363}
364
365} //namespace
366
367extern "C" SAL_DLLPUBLIC_EXPORT css::uno::XInterface *
369 css::uno::XComponentContext *,
370 css::uno::Sequence<css::uno::Any> const &)
371{
372 return cppu::acquire(new SaxLegacyFastParser);
373}
374
375 /* vim:set shiftwidth=4 softtabstop=4 expandtab: */
float u
rtl::Reference< ParserThread > m_xParser
Definition: fastparser.cxx:767
SAL_DLLPUBLIC_EXPORT css::uno::XInterface * com_sun_star_comp_extensions_xml_sax_LegacyFastParser_get_implementation(css::uno::XComponentContext *, css::uno::Sequence< css::uno::Any > const &)
Sequence< sal_Int8 > aSeq
void setLocale(const LanguageTag &languageTag)
Reference< XComponentContext > getProcessComponentContext()
css::uno::Sequence< OUString > getSupportedServiceNames()
OUString getImplementationName()
bool CPPUHELPER_DLLPUBLIC supportsService(css::lang::XServiceInfo *implementation, rtl::OUString const &name)
css::uno::Reference< css::deployment::XPackageRegistry > create(css::uno::Reference< css::deployment::XPackageRegistry > const &xRootRegistry, OUString const &context, OUString const &cachePath, css::uno::Reference< css::uno::XComponentContext > const &xComponentContext)
int i
DefTokenId nToken
unsigned char sal_Bool