1 /* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
3 * This file is part of the LibreOffice project.
5 * This Source Code Form is subject to the terms of the Mozilla Public
6 * License, v. 2.0. If a copy of the MPL was not distributed with this
7 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
9 * This file incorporates work covered by the following license notice:
11 * Licensed to the Apache Software Foundation (ASF) under one or more
12 * contributor license agreements. See the NOTICE file distributed
13 * with this work for additional information regarding copyright
14 * ownership. The ASF licenses this file to you under the Apache
15 * License, Version 2.0 (the "License"); you may not use this file
16 * except in compliance with the License. You may obtain a copy of
17 * the License at http://www.apache.org/licenses/LICENSE-2.0 .
19 #ifndef INCLUDED_SW_SOURCE_FILTER_HTML_SWHTML_HXX
20 #define INCLUDED_SW_SOURCE_FILTER_HTML_SWHTML_HXX
22 #include <config_java.h>
24 #include <sfx2/sfxhtml.hxx>
25 #include <svl/listener.hxx>
26 #include <svl/macitem.hxx>
27 #include <svtools/htmltokn.h>
28 #include <editeng/svxenum.hxx>
29 #include <rtl/ref.hxx>
30 #include <rtl/ustrbuf.hxx>
31 #include <deletelistener.hxx>
33 #include <fltshell.hxx>
34 #include <swtypes.hxx>
36 #include <com/sun/star/drawing/XShape.hpp>
37 #include <com/sun/star/form/XFormComponent.hpp>
38 #include <com/sun/star/beans/XPropertySet.hpp>
50 class SvxMacroTableDtor
;
57 class SwHTMLForm_Impl
;
59 struct SwHTMLFootEndNote_Impl
;
62 class SvxCSS1PropertyInfo
;
65 constexpr tools::Long HTML_CJK_PARSPACE
= o3tl::toTwips(25, o3tl::Length::mm10
); // 2.5mm
66 constexpr tools::Long HTML_CTL_PARSPACE
= o3tl::toTwips(25, o3tl::Length::mm10
); // 2.5mm
68 constexpr tools::Long HTML_DFLT_IMG_WIDTH
= o3tl::toTwips(2, o3tl::Length::cm
); // 2cm
69 constexpr tools::Long HTML_DFLT_IMG_HEIGHT
= o3tl::toTwips(1, o3tl::Length::cm
); // 1cm
71 // some things you often need
72 extern HTMLOptionEnum
<SvxAdjust
> const aHTMLPAlignTable
[];
73 extern HTMLOptionEnum
<sal_Int16
> const aHTMLImgHAlignTable
[];
74 extern HTMLOptionEnum
<sal_Int16
> const aHTMLImgVAlignTable
[];
79 typedef std::deque
<HTMLAttr
*> HTMLAttrs
;
81 // Table of attributes: The order here is important: The attributes in the
82 // beginning of the table will set first in EndAllAttrs.
85 HTMLAttr
* pKeep
; // frame attributes
91 HTMLAttr
* pFirstLineIndent
; // paragraph attributes
92 HTMLAttr
* pTextLeftMargin
;
93 HTMLAttr
* pRightMargin
;
95 HTMLAttr
* pLineSpacing
;
101 HTMLAttr
* pDirection
;
103 HTMLAttr
* pCharFormats
; // text attributes
104 HTMLAttr
* pINetFormat
;
106 HTMLAttr
* pBold
; // character attributes
110 HTMLAttr
* pItalicCJK
;
111 HTMLAttr
* pItalicCTL
;
113 HTMLAttr
* pUnderline
;
118 HTMLAttr
* pFontHeight
;
119 HTMLAttr
* pFontHeightCJK
;
120 HTMLAttr
* pFontHeightCTL
;
121 HTMLAttr
* pFontColor
;
122 HTMLAttr
* pEscapement
;
124 HTMLAttr
* pKerning
; // (only for SPACER)
125 HTMLAttr
* pCharBrush
; // character background
127 HTMLAttr
* pLanguageCJK
;
128 HTMLAttr
* pLanguageCTL
;
134 friend class SwHTMLParser
;
135 friend class CellSaveStruct
;
137 SwNodeIndex m_nStartPara
;
138 SwNodeIndex m_nEndPara
;
139 sal_Int32 m_nStartContent
;
140 sal_Int32 m_nEndContent
;
141 bool m_bInsAtStart
: 1;
142 bool m_bLikePara
: 1; // set attribute above the whole paragraph
143 bool m_bValid
: 1; // is the attribute valid?
145 std::unique_ptr
<SfxPoolItem
> m_pItem
;
146 std::shared_ptr
<HTMLAttrTable
> m_xAttrTab
;
147 HTMLAttr
*m_pNext
; // still to close attributes with different values
148 HTMLAttr
*m_pPrev
; // already closed but not set attributes
149 HTMLAttr
**m_ppHead
; // list head
151 HTMLAttr( const SwPosition
& rPos
, const SfxPoolItem
& rItem
,
152 HTMLAttr
**pHd
, std::shared_ptr
<HTMLAttrTable
> xAttrTab
);
154 HTMLAttr( const HTMLAttr
&rAttr
, const SwNode
&rEndPara
,
155 sal_Int32 nEndCnt
, HTMLAttr
**pHd
, std::shared_ptr
<HTMLAttrTable
> xAttrTab
);
161 HTMLAttr
*Clone( const SwNode
& rEndPara
, sal_Int32 nEndCnt
) const;
162 void Reset( const SwNode
& rSttPara
, sal_Int32 nSttCnt
,
163 HTMLAttr
**pHd
, const std::shared_ptr
<HTMLAttrTable
>& rAttrTab
);
164 inline void SetStart( const SwPosition
& rPos
);
166 SwNodeOffset
GetStartParagraphIdx() const { return m_nStartPara
.GetIndex(); }
167 SwNodeOffset
GetEndParagraphIdx() const { return m_nEndPara
.GetIndex(); }
169 const SwNodeIndex
& GetStartParagraph() const { return m_nStartPara
; }
170 const SwNodeIndex
& GetEndParagraph() const { return m_nEndPara
; }
172 sal_Int32
GetStartContent() const { return m_nStartContent
; }
173 sal_Int32
GetEndContent() const { return m_nEndContent
; }
175 bool IsLikePara() const { return m_bLikePara
; }
176 void SetLikePara() { m_bLikePara
= true; }
178 SfxPoolItem
& GetItem() { return *m_pItem
; }
179 const SfxPoolItem
& GetItem() const { return *m_pItem
; }
181 HTMLAttr
*GetNext() const { return m_pNext
; }
182 void InsertNext( HTMLAttr
*pNxt
) { m_pNext
= pNxt
; }
184 HTMLAttr
*GetPrev() const { return m_pPrev
; }
185 void InsertPrev( HTMLAttr
*pPrv
);
186 void ClearPrev() { m_pPrev
= nullptr; }
188 void SetHead(HTMLAttr
**ppHd
, const std::shared_ptr
<HTMLAttrTable
>& rAttrTab
)
191 m_xAttrTab
= rAttrTab
;
194 // During setting attributes from styles it can happen that these
195 // shouldn't be set anymore. To delete them would be very expensive, because
196 // you don't know all the places where they are linked in. Therefore they're
197 // made invalid and deleted at the next call of SetAttr_().
198 void Invalidate() { m_bValid
= false; }
201 class HTMLAttrContext_SaveDoc
;
203 enum SwHTMLAppendMode
{
204 AM_NORMAL
, // no paragraph spacing handling
205 AM_NOSPACE
, // set spacing hard to 0cm
206 AM_SPACE
, // set spacing hard to 0.5cm
207 AM_SOFTNOSPACE
, // don't set spacing, but save 0cm
211 class HTMLAttrContext
213 HTMLAttrs m_aAttrs
; // the attributes created in the context
215 OUString m_aClass
; // context class
217 std::unique_ptr
<HTMLAttrContext_SaveDoc
> m_pSaveDocContext
;
218 std::unique_ptr
<SfxItemSet
> m_pFrameItemSet
;
220 HtmlTokenId m_nToken
; // the token of the context
222 sal_uInt16 m_nTextFormatColl
; // a style created in the context or zero
224 sal_uInt16 m_nLeftMargin
; // a changed left border
225 sal_uInt16 m_nRightMargin
; // a changed right border
226 sal_uInt16 m_nFirstLineIndent
; // a changed first line indent
228 sal_uInt16 m_nUpperSpace
;
229 sal_uInt16 m_nLowerSpace
;
231 SwHTMLAppendMode m_eAppend
;
233 bool m_bLRSpaceChanged
: 1; // left/right border, changed indent?
234 bool m_bULSpaceChanged
: 1; // top/bottom border changed?
235 bool m_bDefaultTextFormatColl
: 1;// nTextFormatColl is only default
236 bool m_bSpansSection
: 1; // the context opens a SwSection
237 bool m_bPopStack
: 1; // delete above stack elements
238 bool m_bFinishPREListingXMP
: 1;
239 bool m_bRestartPRE
: 1;
240 bool m_bRestartXMP
: 1;
241 bool m_bRestartListing
: 1;
242 bool m_bHeaderOrFooter
: 1;
244 bool m_bVisible
= true;
247 void ClearSaveDocContext();
249 HTMLAttrContext( HtmlTokenId nTokn
, sal_uInt16 nPoolId
, OUString aClass
,
250 bool bDfltColl
=false );
251 explicit HTMLAttrContext( HtmlTokenId nTokn
);
254 HtmlTokenId
GetToken() const { return m_nToken
; }
256 sal_uInt16
GetTextFormatColl() const { return m_bDefaultTextFormatColl
? 0 : m_nTextFormatColl
; }
257 sal_uInt16
GetDefaultTextFormatColl() const { return m_bDefaultTextFormatColl
? m_nTextFormatColl
: 0; }
259 const OUString
& GetClass() const { return m_aClass
; }
261 inline void SetMargins( sal_uInt16 nLeft
, sal_uInt16 nRight
, short nIndent
);
263 bool IsLRSpaceChanged() const { return m_bLRSpaceChanged
; }
264 inline void GetMargins( sal_uInt16
& nLeft
, sal_uInt16
& nRight
,
265 short &nIndent
) const;
267 inline void SetULSpace( sal_uInt16 nUpper
, sal_uInt16 nLower
);
268 bool IsULSpaceChanged() const { return m_bULSpaceChanged
; }
269 inline void GetULSpace( sal_uInt16
& rUpper
, sal_uInt16
& rLower
) const;
271 bool HasAttrs() const { return !m_aAttrs
.empty(); }
272 const HTMLAttrs
& GetAttrs() const { return m_aAttrs
; }
273 HTMLAttrs
& GetAttrs() { return m_aAttrs
; }
275 void SetSpansSection( bool bSet
) { m_bSpansSection
= bSet
; }
276 bool GetSpansSection() const { return m_bSpansSection
; }
278 void SetPopStack( bool bSet
) { m_bPopStack
= bSet
; }
279 bool GetPopStack() const { return m_bPopStack
; }
281 bool HasSaveDocContext() const { return m_pSaveDocContext
!=nullptr; }
282 HTMLAttrContext_SaveDoc
*GetSaveDocContext( bool bCreate
=false );
284 const SfxItemSet
*GetFrameItemSet() const { return m_pFrameItemSet
.get(); }
285 SfxItemSet
*GetFrameItemSet( SwDoc
*pCreateDoc
);
287 void SetFinishPREListingXMP( bool bSet
) { m_bFinishPREListingXMP
= bSet
; }
288 bool IsFinishPREListingXMP() const { return m_bFinishPREListingXMP
; }
290 void SetRestartPRE( bool bSet
) { m_bRestartPRE
= bSet
; }
291 bool IsRestartPRE() const { return m_bRestartPRE
; }
293 void SetRestartXMP( bool bSet
) { m_bRestartXMP
= bSet
; }
294 bool IsRestartXMP() const { return m_bRestartXMP
; }
296 void SetRestartListing( bool bSet
) { m_bRestartListing
= bSet
; }
297 bool IsRestartListing() const { return m_bRestartListing
; }
299 void SetHeaderOrFooter( bool bSet
) { m_bHeaderOrFooter
= bSet
; }
300 bool IsHeaderOrFooter() const { return m_bHeaderOrFooter
; }
302 void SetAppendMode( SwHTMLAppendMode eMode
) { m_eAppend
= eMode
; }
303 SwHTMLAppendMode
GetAppendMode() const { return m_eAppend
; }
305 void SetVisible(bool bVisible
) { m_bVisible
= bVisible
; }
306 bool IsVisible() const { return m_bVisible
; }
309 typedef std::vector
<std::unique_ptr
<HTMLAttrContext
>> HTMLAttrContexts
;
313 class SwHTMLNumRuleInfo
;
315 typedef std::vector
<std::unique_ptr
<ImageMap
>> ImageMaps
;
317 enum class HtmlContextFlags
{
318 ProtectStack
= 0x0001,
320 KeepNumrule
= 0x0004,
324 MultiColMask
= StripPara
| KeepNumrule
| KeepAttrs
// for headers, footers or footnotes
328 template<> struct typed_flags
<HtmlContextFlags
> : is_typed_flags
<HtmlContextFlags
, 0x03f> {};
331 enum class HtmlFrameFormatFlags
{
339 template<> struct typed_flags
<HtmlFrameFormatFlags
> : is_typed_flags
<HtmlFrameFormatFlags
, 0x0f> {};
342 class SwHTMLFrameFormatListener
: public SvtListener
344 SwFrameFormat
* m_pFrameFormat
;
346 SwHTMLFrameFormatListener(SwFrameFormat
* pFrameFormat
);
347 SwFrameFormat
* GetFrameFormat() { return m_pFrameFormat
; }
348 virtual void Notify(const SfxHint
&) override
;
351 class SwHTMLParser
: public SfxHTMLParser
, public SvtListener
353 friend class SectionSaveStruct
;
354 friend class CellSaveStruct
;
355 friend class CaptionSaveStruct
;
360 std::unique_ptr
<ImportProgress
> m_xProgress
;
362 OUString m_aPathToFile
;
364 OUString m_aBasicLib
;
365 OUString m_aBasicModule
;
366 OUString m_aScriptSource
; // content of the current script block
367 OUString m_aScriptType
; // type of read script (StarBasic/VB/JAVA)
368 OUString m_aScriptURL
; // script URL
369 OUString m_aStyleSource
; // content of current style sheet
370 OUString m_aContents
; // text of current marquee, field and so
371 OUStringBuffer m_sTitle
;
372 OUString m_aUnknownToken
; // a started unknown token
373 OUString m_aBulletGrfs
[MAXLEVEL
];
376 std::vector
<sal_uInt16
> m_aBaseFontStack
; // stack for <BASEFONT>
377 // Bit 0-2: font size (1-7)
378 std::vector
<sal_uInt16
> m_aFontStack
; // stack for <FONT>, <BIG>, <SMALL>
379 // Bit 0-2: font size (1-7)
380 // Bit 15: font colour was set
382 HTMLAttrs m_aSetAttrTab
;// "closed", not set attributes
383 HTMLAttrs m_aParaAttrs
; // temporary paragraph attributes
384 std::shared_ptr
<HTMLAttrTable
> m_xAttrTab
; // "open" attributes
385 HTMLAttrContexts m_aContexts
;// the current context of attribute/token
386 std::vector
<std::unique_ptr
<SwHTMLFrameFormatListener
>> m_aMoveFlyFrames
;// Fly-Frames, the anchor is moved
387 std::deque
<sal_Int32
> m_aMoveFlyCnts
;// and the Content-Positions
388 //stray SwTableBoxes which need to be deleted to avoid leaking, but hold
389 //onto them until parsing is done
390 std::vector
<std::unique_ptr
<SwTableBox
>> m_aOrphanedTableBoxes
;
392 std::unique_ptr
<SwApplet_Impl
> m_pAppletImpl
; // current applet
394 std::unique_ptr
<SwCSS1Parser
> m_pCSS1Parser
; // Style-Sheet-Parser
395 std::unique_ptr
<SwHTMLNumRuleInfo
> m_pNumRuleInfo
;
396 std::vector
<SwPending
> m_vPendingStack
;
398 rtl::Reference
<SwDoc
> m_xDoc
;
399 SwPaM
*m_pPam
; // SwPosition should be enough, or ??
400 SwViewShell
*m_pActionViewShell
; // SwViewShell, where StartAction was called
401 SwNodeIndex
*m_pSttNdIdx
;
403 std::vector
<HTMLTable
*> m_aTables
;
404 std::shared_ptr
<HTMLTable
> m_xTable
; // current "outermost" table
405 SwHTMLForm_Impl
* m_pFormImpl
; // current form
406 rtl::Reference
<SdrObject
> m_pMarquee
; // current marquee
407 std::unique_ptr
<SwField
> m_xField
; // current field
408 ImageMap
*m_pImageMap
; // current image map
409 std::unique_ptr
<ImageMaps
> m_pImageMaps
; ///< all Image-Maps that have been read
410 std::unique_ptr
<SwHTMLFootEndNote_Impl
> m_pFootEndNoteImpl
;
412 Size m_aHTMLPageSize
; // page size of HTML template
414 sal_uInt32 m_aFontHeights
[7]; // font heights 1-7
415 ImplSVEvent
* m_nEventId
;
417 sal_uInt16 m_nBaseFontStMin
;
418 sal_uInt16 m_nFontStMin
;
419 sal_uInt16 m_nDefListDeep
;
420 sal_uInt16 m_nFontStHeadStart
; // elements in font stack at <Hn>
421 sal_uInt16 m_nSBModuleCnt
; // counter for basic modules
422 sal_uInt16 m_nMissingImgMaps
; // How many image maps are still missing?
424 size_t m_nContextStMin
; // lower limit of PopContext
425 size_t m_nContextStAttrMin
; // lower limit of attributes
426 sal_uInt16 m_nSelectEntryCnt
; // Number of entries in the actual listbox
427 HtmlTokenId m_nOpenParaToken
; // opened paragraph element
429 enum class JumpToMarks
{ NONE
, Mark
, Table
, Region
, Graphic
};
430 JumpToMarks m_eJumpTo
;
433 sal_uInt16 m_nContinue
; // depth of Continue calls
436 SvxAdjust m_eParaAdjust
; // adjustment of current paragraph
437 HTMLScriptLanguage m_eScriptLang
; // current script language
439 bool m_bOldIsHTMLMode
: 1; // Was it a HTML document?
441 bool m_bDocInitialized
: 1; // document resp. shell was initialize
442 // flag to prevent double init via recursion
443 bool m_bViewCreated
: 1; // the view was already created (asynchronous)
444 bool m_bSetModEnabled
: 1;
446 bool m_bInFloatingFrame
: 1; // We are in a floating frame
448 bool m_bKeepUnknown
: 1; // handle unknown/not supported tokens
450 bool m_bCallNextToken
: 1; // In tables: call NextToken in any case
451 bool m_bIgnoreRawData
: 1; // ignore content of script/style
452 bool m_bLBEntrySelected
: 1; // Is the current option selected?
453 bool m_bTAIgnoreNewPara
: 1; // ignore next LF in text area?
454 bool m_bFixMarqueeWidth
: 1; // Change size of marquee?
456 bool m_bUpperSpace
: 1; // top paragraph spacing is needed
457 bool m_bNoParSpace
: 1;
460 bool m_bInNoEmbed
: 1; // we are in a NOEMBED area
462 bool m_bInTitle
: 1; // we are in title
464 bool m_bChkJumpMark
: 1; // maybe jump to predetermined mark
465 bool m_bUpdateDocStat
: 1;
466 bool m_bFixSelectWidth
: 1; // Set new width of select?
467 bool m_bTextArea
: 1;
470 bool m_bInFootEndNoteAnchor
: 1;
471 bool m_bInFootEndNoteSymbol
: 1;
472 bool m_bIgnoreHTMLComments
: 1;
473 bool m_bRemoveHidden
: 1; // the filter implementation might set the hidden flag
475 bool m_bBodySeen
: 1;
476 bool m_bReadingHeaderOrFooter
: 1;
477 bool m_bNotifyMacroEventRead
: 1;
478 bool m_isInTableStructure
;
481 int m_nFloatingFrames
;
484 /// the names corresponding to the DOCINFO field subtypes INFO[1-4]
485 OUString m_InfoNames
[4];
487 SfxViewFrame
* m_pTempViewFrame
;
489 bool m_bXHTML
= false;
490 bool m_bReqIF
= false;
493 * Non-owning pointers to already inserted OLE nodes, matching opened
494 * <object> XHTML elements.
496 std::stack
<SwOLENode
*> m_aEmbeds
;
498 std::set
<OUString
> m_aAllowedRTFOLEMimeTypes
;
500 /// This is the URL of the outer <object> data if it's not OLE2 or an image.
501 OUString m_aEmbedURL
;
503 void DeleteFormImpl();
505 void DocumentDetected();
508 SwViewShell
*CallStartAction( SwViewShell
*pVSh
= nullptr, bool bChkPtr
= true );
509 SwViewShell
*CallEndAction( bool bChkAction
= false, bool bChkPtr
= true );
510 SwViewShell
*CheckActionViewShell();
512 DECL_LINK( AsyncCallback
, void*, void );
514 // set attribute on document
515 void SetAttr_( bool bChkEnd
, bool bBeforeTable
, std::deque
<std::unique_ptr
<HTMLAttr
>> *pPostIts
);
516 void SetAttr( bool bChkEnd
= true, bool bBeforeTable
= false,
517 std::deque
<std::unique_ptr
<HTMLAttr
>> *pPostIts
= nullptr )
519 if( !m_aSetAttrTab
.empty() || !m_aMoveFlyFrames
.empty() )
520 SetAttr_( bChkEnd
, bBeforeTable
, pPostIts
);
523 HTMLAttr
**GetAttrTabEntry( sal_uInt16 nWhich
);
525 // create a new text node on PaM position
526 bool AppendTextNode( SwHTMLAppendMode eMode
=AM_NORMAL
, bool bUpdateNum
=true );
529 // start/end an attribute
530 // ppDepAttr indicated an attribute table entry, which attribute has to be
531 // set, before the attribute is closed
532 void NewAttr(const std::shared_ptr
<HTMLAttrTable
>& rAttrTab
, HTMLAttr
**ppAttr
, const SfxPoolItem
& rItem
);
533 bool EndAttr( HTMLAttr
*pAttr
, bool bChkEmpty
=true );
534 void DeleteAttr( HTMLAttr
* pAttr
);
536 void EndContextAttrs( HTMLAttrContext
*pContext
);
537 void SaveAttrTab(std::shared_ptr
<HTMLAttrTable
> const & rNewAttrTab
);
538 void SplitAttrTab( const SwPosition
& rNewPos
);
539 void SplitAttrTab(std::shared_ptr
<HTMLAttrTable
> const & rNewAttrTab
, bool bMoveEndBack
);
540 void RestoreAttrTab(std::shared_ptr
<HTMLAttrTable
> const & rNewAttrTab
);
541 void InsertAttr( const SfxPoolItem
& rItem
, bool bInsAtStart
);
542 void InsertAttrs( std::deque
<std::unique_ptr
<HTMLAttr
>> rAttrs
);
544 bool DoPositioning( SfxItemSet
&rItemSet
,
545 SvxCSS1PropertyInfo
&rPropInfo
,
546 HTMLAttrContext
*pContext
);
547 bool CreateContainer( std::u16string_view rClass
, SfxItemSet
&rItemSet
,
548 SvxCSS1PropertyInfo
&rPropInfo
,
549 HTMLAttrContext
*pContext
);
550 bool EndSection( bool bLFStripped
=false );
552 void InsertAttrs( SfxItemSet
&rItemSet
, SvxCSS1PropertyInfo
const &rPropInfo
,
553 HTMLAttrContext
*pContext
, bool bCharLvl
=false );
554 void InsertAttr( HTMLAttr
**ppAttr
, const SfxPoolItem
& rItem
,
555 HTMLAttrContext
*pCntxt
);
556 void SplitPREListingXMP( HTMLAttrContext
*pCntxt
);
557 void FixHeaderFooterDistance( bool bHeader
, const SwPosition
*pOldPos
);
559 void EndContext( HTMLAttrContext
*pContext
);
560 void ClearContext( HTMLAttrContext
*pContext
);
562 const SwFormatColl
*GetCurrFormatColl() const;
564 SwTwips
GetCurrentBrowseWidth();
566 SwHTMLNumRuleInfo
& GetNumInfo() { return *m_pNumRuleInfo
; }
567 // add parameter <bCountedInList>
568 void SetNodeNum( sal_uInt8 nLevel
);
570 // Manage paragraph styles
572 // set the style resp. its attributes on the stack
573 void SetTextCollAttrs( HTMLAttrContext
*pContext
= nullptr );
575 void InsertParaAttrs( const SfxItemSet
& rItemSet
);
577 // Manage attribute context
579 // save current context
580 void PushContext(std::unique_ptr
<HTMLAttrContext
>& rCntxt
)
582 m_aContexts
.push_back(std::move(rCntxt
));
585 // Fetch top/specified context but not outside the context with token
586 // nLimit. If bRemove set then remove it.
587 std::unique_ptr
<HTMLAttrContext
> PopContext(HtmlTokenId nToken
= HtmlTokenId::NONE
);
589 void GetMarginsFromContext( sal_uInt16
&nLeft
, sal_uInt16
&nRight
, short& nIndent
,
590 bool bIgnoreCurrent
=false ) const;
591 void GetMarginsFromContextWithNumberBullet( sal_uInt16
&nLeft
, sal_uInt16
&nRight
,
592 short& nIndent
) const;
593 void GetULSpaceFromContext( sal_uInt16
&rUpper
, sal_uInt16
&rLower
) const;
595 void MovePageDescAttrs( SwNode
*pSrcNd
, SwNodeOffset nDestIdx
, bool bFormatBreak
);
597 // Handling of tags at paragraph level
599 // <P> and <H1> to <H6>
601 void EndPara( bool bReal
= false );
602 void NewHeading( HtmlTokenId nToken
);
605 // <ADDRESS>, <BLOCKQUOTE> and <PRE>
606 void NewTextFormatColl( HtmlTokenId nToken
, sal_uInt16 nPoolId
);
607 void EndTextFormatColl( HtmlTokenId nToken
);
609 // <DIV> and <CENTER>
610 void NewDivision( HtmlTokenId nToken
);
613 // insert/close Fly-Frames
614 void InsertFlyFrame( const SfxItemSet
& rItemSet
, HTMLAttrContext
*pCntxt
,
615 const OUString
& rId
);
617 void SaveDocContext( HTMLAttrContext
*pCntxt
, HtmlContextFlags nFlags
,
618 const SwPosition
*pNewPos
);
619 void RestoreDocContext( HTMLAttrContext
*pCntxt
);
621 // end all opened <DIV> areas
622 bool EndSections( bool bLFStripped
);
625 void NewMultiCol( sal_uInt16 columnsFromCss
=0 );
628 void NewMarquee( HTMLTable
*pCurTable
=nullptr );
630 void InsertMarqueeText();
634 // order list <OL> and unordered list <UL> with <LI>
635 void NewNumberBulletList( HtmlTokenId nToken
);
636 void EndNumberBulletList( HtmlTokenId nToken
= HtmlTokenId::NONE
);
637 void NewNumberBulletListItem( HtmlTokenId nToken
);
638 void EndNumberBulletListItem( HtmlTokenId nToken
, bool bSetColl
);
640 // definitions lists <DL> with <DD>, <DT>
643 void NewDefListItem( HtmlTokenId nToken
);
644 void EndDefListItem( HtmlTokenId nToken
= HtmlTokenId::NONE
);
646 // Handling of tags on character level
648 // handle tags like <B>, <I> and so, which enable/disable a certain
649 // attribute or like <SPAN> get attributes from styles
650 void NewStdAttr( HtmlTokenId nToken
);
651 void NewStdAttr( HtmlTokenId nToken
,
652 HTMLAttr
**ppAttr
, const SfxPoolItem
& rItem
,
653 HTMLAttr
**ppAttr2
=nullptr, const SfxPoolItem
*pItem2
=nullptr,
654 HTMLAttr
**ppAttr3
=nullptr, const SfxPoolItem
*pItem3
=nullptr );
655 void EndTag( HtmlTokenId nToken
);
657 // handle font attributes
658 void NewBasefontAttr(); // for <BASEFONT>
659 void EndBasefontAttr();
660 void NewFontAttr( HtmlTokenId nToken
); // for <FONT>, <BIG> and <SMALL>
661 void EndFontAttr( HtmlTokenId nToken
);
663 // tags realized via character styles
664 void NewCharFormat( HtmlTokenId nToken
);
666 void DeleteSection(SwStartNode
* pSttNd
);
670 static SvxNumType
GetNumType( std::u16string_view rStr
, SvxNumType eDfltType
);
674 void InsertFieldText();
679 // Inserting graphics, plug-ins and applets
681 // search image maps and link with graphic nodes
682 ImageMap
*FindImageMap( std::u16string_view rURL
) const;
683 void ConnectImageMaps();
685 // find anchor of Fly-Frames and set corresponding attributes
686 // in Attrset (htmlgrin.cxx)
687 void SetAnchorAndAdjustment( sal_Int16 eVertOri
,
689 const SvxCSS1PropertyInfo
&rPropInfo
,
690 SfxItemSet
& rFrameSet
);
691 void SetAnchorAndAdjustment( sal_Int16 eVertOri
,
693 SfxItemSet
& rFrameSet
,
694 bool bDontAppend
=false );
695 void SetAnchorAndAdjustment( const SvxCSS1PropertyInfo
&rPropInfo
,
696 SfxItemSet
&rFrameItemSet
);
698 static void SetFrameFormatAttrs( SfxItemSet
&rItemSet
,
699 HtmlFrameFormatFlags nFlags
, SfxItemSet
&rFrameItemSet
);
701 // create frames and register auto bound frames
702 void RegisterFlyFrame( SwFrameFormat
*pFlyFrame
);
704 // Adjust the size of the Fly-Frames to requirements and conditions
705 // (not for graphics, therefore htmlplug.cxx)
706 static void SetFixSize( const Size
& rPixSize
, const Size
& rTwipDfltSize
,
707 bool bPercentWidth
, bool bPercentHeight
,
708 SvxCSS1PropertyInfo
const &rPropInfo
,
709 SfxItemSet
& rFlyItemSet
);
710 static void SetVarSize( SvxCSS1PropertyInfo
const &rPropInfo
,
711 SfxItemSet
& rFlyItemSet
, SwTwips nDfltWidth
=MINLAY
,
712 sal_uInt8 nDefaultPercentWidth
=0 );
713 static void SetSpace( const Size
& rPixSpace
, SfxItemSet
&rItemSet
,
714 SvxCSS1PropertyInfo
&rPropInfo
, SfxItemSet
& rFlyItemSet
);
716 sal_uInt16
IncGrfsThatResizeTable();
718 void GetDefaultScriptType( ScriptType
& rType
,
719 OUString
& rTypeStr
) const;
721 // the actual insert methods for <IMG>, <EMBED>, <APPLET> and <PARAM>
722 void InsertImage(); // htmlgrin.cxx
723 bool InsertEmbed(); // htmlplug.cxx
725 #if HAVE_FEATURE_JAVA
726 void NewObject(); // htmlplug.cxx
728 void EndObject(); // link CommandLine with applet (htmlplug.cxx)
729 #if HAVE_FEATURE_JAVA
730 void InsertApplet(); // htmlplug.cxx
732 void EndApplet(); // link CommandLine with applet (htmlplug.cxx)
733 void InsertParam(); // htmlplug.cxx
735 void InsertFloatingFrame();
737 // parse <BODY>-tag: set background graphic and background colour (htmlgrin.cxx)
738 void InsertBodyOptions();
740 // Inserting links and bookmarks (htmlgrin.cxx)
742 // parse <A>-tag: insert a link resp. bookmark
747 void InsertBookmark( const OUString
& rName
);
749 void InsertCommentText( std::string_view pTag
);
750 void InsertComment( const OUString
& rName
, std::string_view pTag
= {} );
752 // Has the current paragraph bookmarks?
753 bool HasCurrentParaBookmarks( bool bIgnoreStack
=false ) const;
755 // Inserting script/basic elements
757 // parse the last read basic module (htmlbas.cxx)
761 void AddScriptSource();
763 // insert event in SFX configuration (htmlbas.cxx)
764 void InsertBasicDocEvent( const OUString
& aEventName
, const OUString
& rName
,
765 ScriptType eScrType
, const OUString
& rScrType
);
773 static inline bool HasStyleOptions( std::u16string_view rStyle
, std::u16string_view rId
,
774 std::u16string_view rClass
, const OUString
*pLang
=nullptr,
775 const OUString
*pDir
=nullptr );
776 bool ParseStyleOptions( const OUString
&rStyle
, const OUString
&rId
,
777 const OUString
&rClass
, SfxItemSet
&rItemSet
,
778 SvxCSS1PropertyInfo
&rPropInfo
,
779 const OUString
*pLang
=nullptr, const OUString
*pDir
=nullptr );
781 // Inserting Controls and Forms (htmlform.cxx)
783 // Insert draw object into document
784 void InsertDrawObject( SdrObject
* pNewDrawObj
, const Size
& rSpace
,
787 SfxItemSet
& rCSS1ItemSet
,
788 SvxCSS1PropertyInfo
& rCSS1PropInfo
);
789 css::uno::Reference
< css::drawing::XShape
> InsertControl(
790 const css::uno::Reference
< css::form::XFormComponent
> & rFormComp
,
791 const css::uno::Reference
< css::beans::XPropertySet
> & rFCompPropSet
,
795 SfxItemSet
& rCSS1ItemSet
,
796 SvxCSS1PropertyInfo
& rCSS1PropInfo
,
797 const SvxMacroTableDtor
& rMacroTable
,
798 const std::vector
<OUString
>& rUnoMacroTable
,
799 const std::vector
<OUString
>& rUnoMacroParamTable
,
800 bool bSetPropSet
= true,
801 bool bHidden
= false );
802 void SetControlSize( const css::uno::Reference
< css::drawing::XShape
> & rShape
, const Size
& rTextSz
,
803 bool bMinWidth
, bool bMinHeight
);
806 static void ResizeDrawObject( SdrObject
* pObj
, SwTwips nWidth
);
808 static void RegisterDrawObjectToTable( HTMLTable
*pCurTable
, SdrObject
* pObj
,
811 void NewForm( bool bAppend
=true );
812 void EndForm( bool bAppend
=true );
814 // Insert methods for <INPUT>, <TEXTAREA> and <SELECT>
818 void InsertTextAreaText( HtmlTokenId nToken
);
822 void InsertSelectOption();
823 void InsertSelectText();
826 // Inserting tables (htmltab.cxx)
829 // Insert box content after the given node
830 const SwStartNode
*InsertTableSection( const SwStartNode
*pPrevStNd
);
832 // Insert box content at the end of the table containing the PaM
833 // and move the PaM into the cell
834 const SwStartNode
*InsertTableSection( sal_uInt16 nPoolId
);
836 // Insert methods for various table tags
837 std::unique_ptr
<HTMLTableCnts
> InsertTableContents( bool bHead
);
840 // Create a section for the temporary storage of the table caption
841 SwStartNode
*InsertTempTableCaptionSection();
843 void BuildTableCell( HTMLTable
*pTable
, bool bReadOptions
, bool bHead
);
844 void BuildTableRow( HTMLTable
*pTable
, bool bReadOptions
,
845 SvxAdjust eGrpAdjust
, sal_Int16 eVertOri
);
846 void BuildTableSection( HTMLTable
*pTable
, bool bReadOptions
, bool bHead
);
847 void BuildTableColGroup( HTMLTable
*pTable
, bool bReadOptions
);
848 void BuildTableCaption( HTMLTable
*pTable
);
849 std::shared_ptr
<HTMLTable
> BuildTable(SvxAdjust eCellAdjust
,
850 bool bIsParentHead
= false,
851 bool bHasParentSection
=true,
852 bool bHasToFlow
= false);
856 void ParseMoreMetaOptions();
858 bool FileDownload( const OUString
& rURL
, OUString
& rStr
);
861 void InsertIDOption();
862 void InsertLineBreak();
863 void InsertHorzRule();
865 void FillEndNoteInfo( std::u16string_view aContent
);
866 void FillFootNoteInfo( std::u16string_view aContent
);
867 void InsertFootEndNote( const OUString
& rName
, bool bEndNote
, bool bFixed
);
868 void FinishFootEndNote();
869 void InsertFootEndNoteText();
870 SwNodeIndex
*GetFootEndNoteSection( const OUString
& rName
);
872 sal_Int32
StripTrailingLF();
874 // Remove empty paragraph at the PaM position
875 void StripTrailingPara();
876 // If removing an empty node would corrupt the document
877 bool CanRemoveNode(SwNodeOffset nNodeIdx
) const;
879 // Are there fly frames in the current paragraph?
880 bool HasCurrentParaFlys( bool bNoSurroundOnly
= false,
881 bool bSurroundOnly
= false ) const;
883 class TableDepthGuard
886 SwHTMLParser
& m_rParser
;
888 TableDepthGuard(SwHTMLParser
& rParser
)
891 ++m_rParser
.m_nTableDepth
;
893 bool TooDeep() const { return m_rParser
.m_nTableDepth
> 1024; }
896 --m_rParser
.m_nTableDepth
;
900 public: // used in tables
902 // Create brush item (with new) or 0
903 SvxBrushItem
* CreateBrushItem( const Color
*pColor
,
904 const OUString
&rImageURL
,
905 const OUString
&rStyle
,
907 const OUString
&rClass
);
910 // Executed for each token recognized by CallParser
911 virtual void NextToken( HtmlTokenId nToken
) override
;
912 virtual ~SwHTMLParser() override
;
914 // If the document is removed, remove the parser as well
915 virtual void Notify(const SfxHint
&) override
;
917 virtual void AddMetaUserDefined( OUString
const & i_rMetaName
) override
;
921 SwHTMLParser( SwDoc
* pD
, SwPaM
& rCursor
, SvStream
& rIn
,
925 SfxMedium
* pMed
, bool bReadUTF8
,
926 bool bIgnoreHTMLComments
,
927 const OUString
& rNamespace
);
929 virtual SvParserState
CallParser() override
;
931 static sal_uInt16
ToTwips( sal_uInt16 nPixel
);
933 // for reading asynchronously from SvStream
934 virtual void Continue( HtmlTokenId nToken
) override
;
936 virtual bool ParseMetaOptions( const css::uno::Reference
<css::document::XDocumentProperties
>&,
937 SvKeyValueIterator
* ) override
;
940 void RegisterHTMLTable(HTMLTable
* pNew
)
942 m_aTables
.push_back(pNew
);
945 void DeregisterHTMLTable(HTMLTable
* pOld
);
947 SwDoc
* GetDoc() const;
949 bool IsReqIF() const;
951 bool IsReadingHeaderOrFooter() const { return m_bReadingHeaderOrFooter
; }
953 void NotifyMacroEventRead();
955 /// Strips query and fragment from a URL path if base URL is a file:// one.
956 static OUString
StripQueryFromPath(std::u16string_view rBase
, const OUString
& rPath
);
961 virtual ~SwPendingData() {}
967 std::unique_ptr
<SwPendingData
> pData
;
969 SwPending( HtmlTokenId nTkn
)
974 inline void HTMLAttr::SetStart( const SwPosition
& rPos
)
976 m_nStartPara
= rPos
.GetNode();
977 m_nStartContent
= rPos
.GetContentIndex();
978 m_nEndPara
= m_nStartPara
;
979 m_nEndContent
= m_nStartContent
;
982 inline void HTMLAttrContext::SetMargins( sal_uInt16 nLeft
, sal_uInt16 nRight
,
985 m_nLeftMargin
= nLeft
;
986 m_nRightMargin
= nRight
;
987 m_nFirstLineIndent
= nIndent
;
988 m_bLRSpaceChanged
= true;
991 inline void HTMLAttrContext::GetMargins( sal_uInt16
& nLeft
,
993 short& nIndent
) const
995 if( m_bLRSpaceChanged
)
997 nLeft
= m_nLeftMargin
;
998 nRight
= m_nRightMargin
;
999 nIndent
= m_nFirstLineIndent
;
1003 inline void HTMLAttrContext::SetULSpace( sal_uInt16 nUpper
, sal_uInt16 nLower
)
1005 m_nUpperSpace
= nUpper
;
1006 m_nLowerSpace
= nLower
;
1007 m_bULSpaceChanged
= true;
1010 inline void HTMLAttrContext::GetULSpace( sal_uInt16
& rUpper
,
1011 sal_uInt16
& rLower
) const
1013 if( m_bULSpaceChanged
)
1015 rUpper
= m_nUpperSpace
;
1016 rLower
= m_nLowerSpace
;
1020 inline bool SwHTMLParser::HasStyleOptions( std::u16string_view rStyle
,
1021 std::u16string_view rId
,
1022 std::u16string_view rClass
,
1023 const OUString
*pLang
,
1024 const OUString
*pDir
)
1026 return !rStyle
.empty() || !rId
.empty() || !rClass
.empty() ||
1027 (pLang
&& !pLang
->isEmpty()) || (pDir
&& !pDir
->isEmpty());
1030 class SwTextFootnote
;
1032 class SwHTMLTextFootnote
1036 SwTextFootnote
* m_pTextFootnote
;
1037 std::unique_ptr
<SvtDeleteListener
> m_xDeleteListener
;
1039 SwHTMLTextFootnote(OUString rName
, SwTextFootnote
* pInTextFootnote
)
1040 : m_sName(std::move(rName
))
1041 , m_pTextFootnote(pInTextFootnote
)
1042 , m_xDeleteListener(new SvtDeleteListener(static_cast<SwFormatFootnote
&>(pInTextFootnote
->GetAttr()).GetNotifier()))
1045 const OUString
& GetName() const
1049 const SwNodeIndex
* GetStartNode() const
1051 if (m_xDeleteListener
->WasDeleted())
1053 return m_pTextFootnote
->GetStartNode();
1057 struct SwHTMLFootEndNote_Impl
1059 std::vector
<SwHTMLTextFootnote
> aTextFootnotes
;
1062 OUString sContent
; // information for the last footnote
1069 /* vim:set shiftwidth=4 softtabstop=4 expandtab: */