Version 7.1.7.1, tag libreoffice-7.1.7.1
[LibreOffice.git] / linguistic / source / gciterator.cxx
blobad2c377e6e6d29b9f0d6740462df98834d66224a
1 /* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
2 /*
3 * This file is part of the LibreOffice project.
5 * This Source Code Form is subject to the terms of the Mozilla Public
6 * License, v. 2.0. If a copy of the MPL was not distributed with this
7 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
9 * This file incorporates work covered by the following license notice:
11 * Licensed to the Apache Software Foundation (ASF) under one or more
12 * contributor license agreements. See the NOTICE file distributed
13 * with this work for additional information regarding copyright
14 * ownership. The ASF licenses this file to you under the Apache
15 * License, Version 2.0 (the "License"); you may not use this file
16 * except in compliance with the License. You may obtain a copy of
17 * the License at http://www.apache.org/licenses/LICENSE-2.0 .
20 #include <sal/macros.h>
21 #include <com/sun/star/beans/XPropertySet.hpp>
22 #include <com/sun/star/container/ElementExistException.hpp>
23 #include <com/sun/star/container/XNameAccess.hpp>
24 #include <com/sun/star/configuration/theDefaultProvider.hpp>
25 #include <com/sun/star/i18n/BreakIterator.hpp>
26 #include <com/sun/star/lang/IndexOutOfBoundsException.hpp>
27 #include <com/sun/star/lang/XComponent.hpp>
28 #include <com/sun/star/lang/XServiceInfo.hpp>
29 #include <com/sun/star/lang/XMultiServiceFactory.hpp>
30 #include <com/sun/star/linguistic2/XSupportedLocales.hpp>
31 #include <com/sun/star/linguistic2/XProofreader.hpp>
32 #include <com/sun/star/linguistic2/XProofreadingIterator.hpp>
33 #include <com/sun/star/linguistic2/SingleProofreadingError.hpp>
34 #include <com/sun/star/linguistic2/ProofreadingResult.hpp>
35 #include <com/sun/star/linguistic2/LinguServiceEvent.hpp>
36 #include <com/sun/star/linguistic2/LinguServiceEventFlags.hpp>
37 #include <com/sun/star/text/TextMarkupType.hpp>
38 #include <com/sun/star/text/TextMarkupDescriptor.hpp>
39 #include <com/sun/star/text/XMultiTextMarkup.hpp>
40 #include <com/sun/star/text/XFlatParagraph.hpp>
41 #include <com/sun/star/text/XFlatParagraphIterator.hpp>
42 #include <com/sun/star/uno/XComponentContext.hpp>
44 #include <sal/config.h>
45 #include <sal/log.hxx>
46 #include <o3tl/safeint.hxx>
47 #include <osl/conditn.hxx>
48 #include <cppuhelper/supportsservice.hxx>
49 #include <cppuhelper/weak.hxx>
50 #include <i18nlangtag/languagetag.hxx>
51 #include <comphelper/processfactory.hxx>
52 #include <comphelper/propertysequence.hxx>
53 #include <tools/debug.hxx>
54 #include <tools/diagnose_ex.h>
56 #include <map>
58 #include <linguistic/misc.hxx>
60 #include "gciterator.hxx"
62 using namespace linguistic;
63 using namespace ::com::sun::star;
65 // white space list: obtained from the fonts.config.txt of a Linux system.
66 const sal_Unicode aWhiteSpaces[] =
68 0x0020, /* SPACE */
69 0x00a0, /* NO-BREAK SPACE */
70 0x00ad, /* SOFT HYPHEN */
71 0x115f, /* HANGUL CHOSEONG FILLER */
72 0x1160, /* HANGUL JUNGSEONG FILLER */
73 0x1680, /* OGHAM SPACE MARK */
74 0x2000, /* EN QUAD */
75 0x2001, /* EM QUAD */
76 0x2002, /* EN SPACE */
77 0x2003, /* EM SPACE */
78 0x2004, /* THREE-PER-EM SPACE */
79 0x2005, /* FOUR-PER-EM SPACE */
80 0x2006, /* SIX-PER-EM SPACE */
81 0x2007, /* FIGURE SPACE */
82 0x2008, /* PUNCTUATION SPACE */
83 0x2009, /* THIN SPACE */
84 0x200a, /* HAIR SPACE */
85 0x200b, /* ZERO WIDTH SPACE */
86 0x200c, /* ZERO WIDTH NON-JOINER */
87 0x200d, /* ZERO WIDTH JOINER */
88 0x200e, /* LEFT-TO-RIGHT MARK */
89 0x200f, /* RIGHT-TO-LEFT MARK */
90 0x2028, /* LINE SEPARATOR */
91 0x2029, /* PARAGRAPH SEPARATOR */
92 0x202a, /* LEFT-TO-RIGHT EMBEDDING */
93 0x202b, /* RIGHT-TO-LEFT EMBEDDING */
94 0x202c, /* POP DIRECTIONAL FORMATTING */
95 0x202d, /* LEFT-TO-RIGHT OVERRIDE */
96 0x202e, /* RIGHT-TO-LEFT OVERRIDE */
97 0x202f, /* NARROW NO-BREAK SPACE */
98 0x205f, /* MEDIUM MATHEMATICAL SPACE */
99 0x2060, /* WORD JOINER */
100 0x2061, /* FUNCTION APPLICATION */
101 0x2062, /* INVISIBLE TIMES */
102 0x2063, /* INVISIBLE SEPARATOR */
103 0x206A, /* INHIBIT SYMMETRIC SWAPPING */
104 0x206B, /* ACTIVATE SYMMETRIC SWAPPING */
105 0x206C, /* INHIBIT ARABIC FORM SHAPING */
106 0x206D, /* ACTIVATE ARABIC FORM SHAPING */
107 0x206E, /* NATIONAL DIGIT SHAPES */
108 0x206F, /* NOMINAL DIGIT SHAPES */
109 0x3000, /* IDEOGRAPHIC SPACE */
110 0x3164, /* HANGUL FILLER */
111 0xfeff, /* ZERO WIDTH NO-BREAK SPACE */
112 0xffa0, /* HALFWIDTH HANGUL FILLER */
113 0xfff9, /* INTERLINEAR ANNOTATION ANCHOR */
114 0xfffa, /* INTERLINEAR ANNOTATION SEPARATOR */
115 0xfffb /* INTERLINEAR ANNOTATION TERMINATOR */
118 // Information about reason for proofreading (ProofInfo)
119 const sal_Int32 PROOFINFO_GET_PROOFRESULT = 1;
120 const sal_Int32 PROOFINFO_MARK_PARAGRAPH = 2;
122 const int nWhiteSpaces = SAL_N_ELEMENTS( aWhiteSpaces );
124 static bool lcl_IsWhiteSpace( sal_Unicode cChar )
126 bool bFound = false;
127 for (int i = 0; i < nWhiteSpaces && !bFound; ++i)
129 if (cChar == aWhiteSpaces[i])
130 bFound = true;
132 return bFound;
135 static sal_Int32 lcl_SkipWhiteSpaces( const OUString &rText, sal_Int32 nStartPos )
137 // note having nStartPos point right behind the string is OK since that one
138 // is a correct end-of-sentence position to be returned from a grammar checker...
140 const sal_Int32 nLen = rText.getLength();
141 bool bIllegalArgument = false;
142 if (nStartPos < 0)
144 bIllegalArgument = true;
145 nStartPos = 0;
147 if (nStartPos > nLen)
149 bIllegalArgument = true;
150 nStartPos = nLen;
152 if (bIllegalArgument)
154 SAL_WARN( "linguistic", "lcl_SkipWhiteSpaces: illegal arguments" );
157 sal_Int32 nRes = nStartPos;
158 if (0 <= nStartPos && nStartPos < nLen)
160 const sal_Unicode* const pEnd = rText.getStr() + nLen;
161 const sal_Unicode *pText = rText.getStr() + nStartPos;
162 while (pText != pEnd && lcl_IsWhiteSpace(*pText))
163 ++pText;
164 nRes = pText - rText.getStr();
167 DBG_ASSERT( 0 <= nRes && nRes <= nLen, "lcl_SkipWhiteSpaces return value out of range" );
168 return nRes;
171 static sal_Int32 lcl_BacktraceWhiteSpaces( const OUString &rText, sal_Int32 nStartPos )
173 // note: having nStartPos point right behind the string is OK since that one
174 // is a correct end-of-sentence position to be returned from a grammar checker...
176 const sal_Int32 nLen = rText.getLength();
177 bool bIllegalArgument = false;
178 if (nStartPos < 0)
180 bIllegalArgument = true;
181 nStartPos = 0;
183 if (nStartPos > nLen)
185 bIllegalArgument = true;
186 nStartPos = nLen;
188 if (bIllegalArgument)
190 SAL_WARN( "linguistic", "lcl_BacktraceWhiteSpaces: illegal arguments" );
193 sal_Int32 nRes = nStartPos;
194 sal_Int32 nPosBefore = nStartPos - 1;
195 const sal_Unicode *pStart = rText.getStr();
196 if (0 <= nPosBefore && nPosBefore < nLen && lcl_IsWhiteSpace( pStart[ nPosBefore ] ))
198 nStartPos = nPosBefore;
199 const sal_Unicode *pText = rText.getStr() + nStartPos;
200 while (pText > pStart && lcl_IsWhiteSpace( *pText ))
201 --pText;
202 // now add 1 since we want to point to the first char after the last char in the sentence...
203 nRes = pText - pStart + 1;
206 DBG_ASSERT( 0 <= nRes && nRes <= nLen, "lcl_BacktraceWhiteSpaces return value out of range" );
207 return nRes;
211 extern "C" {
213 static void lcl_workerfunc (void * gci)
215 osl_setThreadName("GrammarCheckingIterator");
217 static_cast<GrammarCheckingIterator*>(gci)->DequeueAndCheck();
222 static lang::Locale lcl_GetPrimaryLanguageOfSentence(
223 const uno::Reference< text::XFlatParagraph >& xFlatPara,
224 sal_Int32 nStartIndex )
226 //get the language of the first word
227 return xFlatPara->getLanguageOfText( nStartIndex, 1 );
231 LngXStringKeyMap::LngXStringKeyMap() {}
233 void SAL_CALL LngXStringKeyMap::insertValue(const OUString& aKey, const css::uno::Any& aValue)
235 std::map<OUString, css::uno::Any>::const_iterator aIter = maMap.find(aKey);
236 if (aIter != maMap.end())
237 throw css::container::ElementExistException();
239 maMap[aKey] = aValue;
242 css::uno::Any SAL_CALL LngXStringKeyMap::getValue(const OUString& aKey)
244 std::map<OUString, css::uno::Any>::const_iterator aIter = maMap.find(aKey);
245 if (aIter == maMap.end())
246 throw css::container::NoSuchElementException();
248 return (*aIter).second;
251 sal_Bool SAL_CALL LngXStringKeyMap::hasValue(const OUString& aKey)
253 return maMap.find(aKey) != maMap.end();
256 ::sal_Int32 SAL_CALL LngXStringKeyMap::getCount() { return maMap.size(); }
258 OUString SAL_CALL LngXStringKeyMap::getKeyByIndex(::sal_Int32 nIndex)
260 if (nIndex < 0 || o3tl::make_unsigned(nIndex) >= maMap.size())
261 throw css::lang::IndexOutOfBoundsException();
263 return OUString();
266 css::uno::Any SAL_CALL LngXStringKeyMap::getValueByIndex(::sal_Int32 nIndex)
268 if (nIndex < 0 || o3tl::make_unsigned(nIndex) >= maMap.size())
269 throw css::lang::IndexOutOfBoundsException();
271 return css::uno::Any();
275 GrammarCheckingIterator::GrammarCheckingIterator() :
276 m_bEnd( false ),
277 m_aCurCheckedDocId(),
278 m_bGCServicesChecked( false ),
279 m_nDocIdCounter( 0 ),
280 m_thread(nullptr),
281 m_aEventListeners( MyMutex::get() ),
282 m_aNotifyListeners( MyMutex::get() )
287 GrammarCheckingIterator::~GrammarCheckingIterator()
289 TerminateThread();
292 void GrammarCheckingIterator::TerminateThread()
294 oslThread t;
296 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
297 t = m_thread;
298 m_thread = nullptr;
299 m_bEnd = true;
300 m_aWakeUpThread.set();
302 if (t != nullptr)
304 osl_joinWithThread(t);
305 osl_destroyThread(t);
309 sal_Int32 GrammarCheckingIterator::NextDocId()
311 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
312 m_nDocIdCounter += 1;
313 return m_nDocIdCounter;
317 OUString GrammarCheckingIterator::GetOrCreateDocId(
318 const uno::Reference< lang::XComponent > &xComponent )
320 // internal method; will always be called with locked mutex
322 OUString aRes;
323 if (xComponent.is())
325 if (m_aDocIdMap.find( xComponent.get() ) != m_aDocIdMap.end())
327 // return already existing entry
328 aRes = m_aDocIdMap[ xComponent.get() ];
330 else // add new entry
332 sal_Int32 nRes = NextDocId();
333 aRes = OUString::number( nRes );
334 m_aDocIdMap[ xComponent.get() ] = aRes;
335 xComponent->addEventListener( this );
338 return aRes;
342 void GrammarCheckingIterator::AddEntry(
343 const uno::WeakReference< text::XFlatParagraphIterator >& xFlatParaIterator,
344 const uno::WeakReference< text::XFlatParagraph >& xFlatPara,
345 const OUString & rDocId,
346 sal_Int32 nStartIndex,
347 bool bAutomatic )
349 // we may not need/have a xFlatParaIterator (e.g. if checkGrammarAtPos was called)
350 // but we always need a xFlatPara...
351 uno::Reference< text::XFlatParagraph > xPara( xFlatPara );
352 if (!xPara.is())
353 return;
355 FPEntry aNewFPEntry;
356 aNewFPEntry.m_xParaIterator = xFlatParaIterator;
357 aNewFPEntry.m_xPara = xFlatPara;
358 aNewFPEntry.m_aDocId = rDocId;
359 aNewFPEntry.m_nStartIndex = nStartIndex;
360 aNewFPEntry.m_bAutomatic = bAutomatic;
362 // add new entry to the end of this queue
363 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
364 if (!m_thread)
365 m_thread = osl_createThread( lcl_workerfunc, this );
366 m_aFPEntriesQueue.push_back( aNewFPEntry );
368 // wake up the thread in order to do grammar checking
369 m_aWakeUpThread.set();
373 void GrammarCheckingIterator::ProcessResult(
374 const linguistic2::ProofreadingResult &rRes,
375 const uno::Reference< text::XFlatParagraphIterator > &rxFlatParagraphIterator,
376 bool bIsAutomaticChecking )
378 DBG_ASSERT( rRes.xFlatParagraph.is(), "xFlatParagraph is missing" );
379 //no guard necessary as no members are used
380 bool bContinueWithNextPara = false;
381 if (!rRes.xFlatParagraph.is() || rRes.xFlatParagraph->isModified())
383 // if paragraph was modified/deleted meanwhile continue with the next one...
384 bContinueWithNextPara = true;
386 else // paragraph is still unchanged...
388 // mark found errors...
390 sal_Int32 nTextLen = rRes.aText.getLength();
391 bool bBoundariesOk = 0 <= rRes.nStartOfSentencePosition && rRes.nStartOfSentencePosition <= nTextLen &&
392 0 <= rRes.nBehindEndOfSentencePosition && rRes.nBehindEndOfSentencePosition <= nTextLen &&
393 0 <= rRes.nStartOfNextSentencePosition && rRes.nStartOfNextSentencePosition <= nTextLen &&
394 rRes.nStartOfSentencePosition <= rRes.nBehindEndOfSentencePosition &&
395 rRes.nBehindEndOfSentencePosition <= rRes.nStartOfNextSentencePosition;
396 DBG_ASSERT( bBoundariesOk, "inconsistent sentence boundaries" );
398 uno::Reference< text::XMultiTextMarkup > xMulti( rRes.xFlatParagraph, uno::UNO_QUERY );
399 if (xMulti.is()) // use new API for markups
403 // length = number of found errors + 1 sentence markup
404 sal_Int32 nErrors = rRes.aErrors.getLength();
405 uno::Sequence< text::TextMarkupDescriptor > aDescriptors( nErrors + 1 );
406 text::TextMarkupDescriptor * pDescriptors = aDescriptors.getArray();
408 // at pos 0 .. nErrors-1 -> all grammar errors
409 for (const linguistic2::SingleProofreadingError &rError : rRes.aErrors)
411 text::TextMarkupDescriptor &rDesc = *pDescriptors++;
413 rDesc.nType = rError.nErrorType;
414 rDesc.nOffset = rError.nErrorStart;
415 rDesc.nLength = rError.nErrorLength;
417 // the proofreader may return SPELLING but right now our core
418 // does only handle PROOFREADING if the result is from the proofreader...
419 // (later on we may wish to color spelling errors found by the proofreader
420 // differently for example. But no special handling right now.
421 if (rDesc.nType == text::TextMarkupType::SPELLCHECK)
422 rDesc.nType = text::TextMarkupType::PROOFREADING;
424 uno::Reference< container::XStringKeyMap > xKeyMap(
425 new LngXStringKeyMap());
426 for( const beans::PropertyValue& rProperty : rError.aProperties )
428 if ( rProperty.Name == "LineColor" )
430 xKeyMap->insertValue(rProperty.Name,
431 rProperty.Value);
432 rDesc.xMarkupInfoContainer = xKeyMap;
434 else if ( rProperty.Name == "LineType" )
436 xKeyMap->insertValue(rProperty.Name,
437 rProperty.Value);
438 rDesc.xMarkupInfoContainer = xKeyMap;
443 // at pos nErrors -> sentence markup
444 // nSentenceLength: includes the white-spaces following the sentence end...
445 const sal_Int32 nSentenceLength = rRes.nStartOfNextSentencePosition - rRes.nStartOfSentencePosition;
446 pDescriptors->nType = text::TextMarkupType::SENTENCE;
447 pDescriptors->nOffset = rRes.nStartOfSentencePosition;
448 pDescriptors->nLength = nSentenceLength;
450 xMulti->commitMultiTextMarkup( aDescriptors ) ;
452 catch (lang::IllegalArgumentException &)
454 OSL_FAIL( "commitMultiTextMarkup: IllegalArgumentException exception caught" );
458 // other sentences left to be checked in this paragraph?
459 if (rRes.nStartOfNextSentencePosition < rRes.aText.getLength())
461 AddEntry( rxFlatParagraphIterator, rRes.xFlatParagraph, rRes.aDocumentIdentifier, rRes.nStartOfNextSentencePosition, bIsAutomaticChecking );
463 else // current paragraph finished
465 // set "already checked" flag for the current flat paragraph
466 if (rRes.xFlatParagraph.is())
467 rRes.xFlatParagraph->setChecked( text::TextMarkupType::PROOFREADING, true );
469 bContinueWithNextPara = true;
473 if (bContinueWithNextPara)
475 // we need to continue with the next paragraph
476 uno::Reference< text::XFlatParagraph > xFlatParaNext;
477 if (rxFlatParagraphIterator.is())
478 xFlatParaNext = rxFlatParagraphIterator->getNextPara();
480 AddEntry( rxFlatParagraphIterator, xFlatParaNext, rRes.aDocumentIdentifier, 0, bIsAutomaticChecking );
486 uno::Reference< linguistic2::XProofreader > GrammarCheckingIterator::GetGrammarChecker(
487 const lang::Locale &rLocale )
489 uno::Reference< linguistic2::XProofreader > xRes;
491 // ---- THREAD SAFE START ----
492 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
494 // check supported locales for each grammarchecker if not already done
495 if (!m_bGCServicesChecked)
497 GetConfiguredGCSvcs_Impl();
498 m_bGCServicesChecked = true;
501 const LanguageType nLang = LanguageTag::convertToLanguageType( rLocale, false);
502 GCImplNames_t::const_iterator aLangIt( m_aGCImplNamesByLang.find( nLang ) );
503 if (aLangIt != m_aGCImplNamesByLang.end()) // matching configured language found?
505 OUString aSvcImplName( aLangIt->second );
506 GCReferences_t::const_iterator aImplNameIt( m_aGCReferencesByService.find( aSvcImplName ) );
507 if (aImplNameIt != m_aGCReferencesByService.end()) // matching impl name found?
509 xRes = aImplNameIt->second;
511 else // the service is to be instantiated here for the first time...
515 uno::Reference< uno::XComponentContext > xContext( comphelper::getProcessComponentContext() );
516 uno::Reference< linguistic2::XProofreader > xGC(
517 xContext->getServiceManager()->createInstanceWithContext(aSvcImplName, xContext),
518 uno::UNO_QUERY_THROW );
519 uno::Reference< linguistic2::XSupportedLocales > xSuppLoc( xGC, uno::UNO_QUERY_THROW );
521 if (xSuppLoc->hasLocale( rLocale ))
523 m_aGCReferencesByService[ aSvcImplName ] = xGC;
524 xRes = xGC;
526 uno::Reference< linguistic2::XLinguServiceEventBroadcaster > xBC( xGC, uno::UNO_QUERY );
527 if (xBC.is())
528 xBC->addLinguServiceEventListener( this );
530 else
532 SAL_WARN( "linguistic", "grammar checker does not support required locale" );
535 catch (uno::Exception &)
537 SAL_WARN( "linguistic", "instantiating grammar checker failed" );
541 // ---- THREAD SAFE END ----
543 return xRes;
546 static uno::Sequence<beans::PropertyValue>
547 lcl_makeProperties(uno::Reference<text::XFlatParagraph> const& xFlatPara, sal_Int32 nProofInfo)
549 uno::Reference<beans::XPropertySet> const xProps(
550 xFlatPara, uno::UNO_QUERY_THROW);
551 css::uno::Any a (nProofInfo);
552 return comphelper::InitPropertySequence({
553 { "FieldPositions", xProps->getPropertyValue("FieldPositions") },
554 { "FootnotePositions", xProps->getPropertyValue("FootnotePositions") },
555 { "ProofInfo", a }
559 void GrammarCheckingIterator::DequeueAndCheck()
561 for (;;)
563 // ---- THREAD SAFE START ----
564 bool bQueueEmpty = false;
566 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
567 if (m_bEnd)
569 break;
571 bQueueEmpty = m_aFPEntriesQueue.empty();
573 // ---- THREAD SAFE END ----
575 if (!bQueueEmpty)
577 uno::Reference< text::XFlatParagraphIterator > xFPIterator;
578 uno::Reference< text::XFlatParagraph > xFlatPara;
579 FPEntry aFPEntryItem;
580 OUString aCurDocId;
581 // ---- THREAD SAFE START ----
583 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
584 aFPEntryItem = m_aFPEntriesQueue.front();
585 xFPIterator = aFPEntryItem.m_xParaIterator;
586 xFlatPara = aFPEntryItem.m_xPara;
587 m_aCurCheckedDocId = aFPEntryItem.m_aDocId;
588 aCurDocId = m_aCurCheckedDocId;
590 m_aFPEntriesQueue.pop_front();
592 // ---- THREAD SAFE END ----
594 if (xFlatPara.is() && xFPIterator.is())
598 OUString aCurTxt( xFlatPara->getText() );
599 lang::Locale aCurLocale = lcl_GetPrimaryLanguageOfSentence( xFlatPara, aFPEntryItem.m_nStartIndex );
601 const bool bModified = xFlatPara->isModified();
602 if (!bModified)
604 linguistic2::ProofreadingResult aRes;
606 // ---- THREAD SAFE START ----
608 osl::ClearableMutexGuard aGuard(MyMutex::get());
610 sal_Int32 nStartPos = aFPEntryItem.m_nStartIndex;
611 sal_Int32 nSuggestedEnd
612 = GetSuggestedEndOfSentence(aCurTxt, nStartPos, aCurLocale);
613 DBG_ASSERT((nSuggestedEnd == 0 && aCurTxt.isEmpty())
614 || nSuggestedEnd > nStartPos,
615 "nSuggestedEndOfSentencePos calculation failed?");
617 uno::Reference<linguistic2::XProofreader> xGC =
618 GetGrammarChecker(aCurLocale);
619 if (xGC.is())
621 aGuard.clear();
622 uno::Sequence<beans::PropertyValue> const aProps(
623 lcl_makeProperties(xFlatPara, PROOFINFO_MARK_PARAGRAPH));
624 aRes = xGC->doProofreading(aCurDocId, aCurTxt, aCurLocale,
625 nStartPos, nSuggestedEnd, aProps);
627 //!! work-around to prevent looping if the grammar checker
628 //!! failed to properly identify the sentence end
629 if (aRes.nBehindEndOfSentencePosition <= nStartPos
630 && aRes.nBehindEndOfSentencePosition != nSuggestedEnd)
632 SAL_WARN(
633 "linguistic",
634 "!! Grammarchecker failed to provide end of sentence !!");
635 aRes.nBehindEndOfSentencePosition = nSuggestedEnd;
638 aRes.xFlatParagraph = xFlatPara;
639 aRes.nStartOfSentencePosition = nStartPos;
641 else
643 // no grammar checker -> no error
644 // but we need to provide the data below in order to continue with the next sentence
645 aRes.aDocumentIdentifier = aCurDocId;
646 aRes.xFlatParagraph = xFlatPara;
647 aRes.aText = aCurTxt;
648 aRes.aLocale = aCurLocale;
649 aRes.nStartOfSentencePosition = nStartPos;
650 aRes.nBehindEndOfSentencePosition = nSuggestedEnd;
652 aRes.nStartOfNextSentencePosition
653 = lcl_SkipWhiteSpaces(aCurTxt, aRes.nBehindEndOfSentencePosition);
654 aRes.nBehindEndOfSentencePosition = lcl_BacktraceWhiteSpaces(
655 aCurTxt, aRes.nStartOfNextSentencePosition);
657 //guard has to be cleared as ProcessResult calls out of this class
659 // ---- THREAD SAFE END ----
660 ProcessResult( aRes, xFPIterator, aFPEntryItem.m_bAutomatic );
662 else
664 // the paragraph changed meanwhile... (and maybe is still edited)
665 // thus we simply continue to ask for the next to be checked.
666 uno::Reference< text::XFlatParagraph > xFlatParaNext( xFPIterator->getNextPara() );
667 AddEntry( xFPIterator, xFlatParaNext, aCurDocId, 0, aFPEntryItem.m_bAutomatic );
670 catch (css::uno::Exception &)
672 TOOLS_WARN_EXCEPTION("linguistic", "GrammarCheckingIterator::DequeueAndCheck ignoring");
676 // ---- THREAD SAFE START ----
678 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
679 m_aCurCheckedDocId.clear();
681 // ---- THREAD SAFE END ----
683 else
685 // ---- THREAD SAFE START ----
687 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
688 if (m_bEnd)
690 break;
692 // Check queue state again
693 if (m_aFPEntriesQueue.empty())
694 m_aWakeUpThread.reset();
696 // ---- THREAD SAFE END ----
698 //if the queue is empty
699 // IMPORTANT: Don't call condition.wait() with locked
700 // mutex. Otherwise you would keep out other threads
701 // to add entries to the queue! A condition is thread-
702 // safe implemented.
703 m_aWakeUpThread.wait();
709 void SAL_CALL GrammarCheckingIterator::startProofreading(
710 const uno::Reference< ::uno::XInterface > & xDoc,
711 const uno::Reference< text::XFlatParagraphIteratorProvider > & xIteratorProvider )
713 // get paragraph to start checking with
714 const bool bAutomatic = true;
715 uno::Reference<text::XFlatParagraphIterator> xFPIterator = xIteratorProvider->getFlatParagraphIterator(
716 text::TextMarkupType::PROOFREADING, bAutomatic );
717 uno::Reference< text::XFlatParagraph > xPara( xFPIterator.is()? xFPIterator->getFirstPara() : nullptr );
718 uno::Reference< lang::XComponent > xComponent( xDoc, uno::UNO_QUERY );
720 // ---- THREAD SAFE START ----
721 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
722 if (xPara.is() && xComponent.is())
724 OUString aDocId = GetOrCreateDocId( xComponent );
726 // create new entry and add it to queue
727 AddEntry( xFPIterator, xPara, aDocId, 0, bAutomatic );
729 // ---- THREAD SAFE END ----
733 linguistic2::ProofreadingResult SAL_CALL GrammarCheckingIterator::checkSentenceAtPosition(
734 const uno::Reference< uno::XInterface >& xDoc,
735 const uno::Reference< text::XFlatParagraph >& xFlatPara,
736 const OUString& rText,
737 const lang::Locale&,
738 sal_Int32 nStartOfSentencePos,
739 sal_Int32 nSuggestedEndOfSentencePos,
740 sal_Int32 nErrorPosInPara )
742 // for the context menu...
744 linguistic2::ProofreadingResult aRes;
746 uno::Reference< lang::XComponent > xComponent( xDoc, uno::UNO_QUERY );
747 if (xFlatPara.is() && xComponent.is() &&
748 ( nErrorPosInPara < 0 || nErrorPosInPara < rText.getLength()))
750 // iterate through paragraph until we find the sentence we are interested in
751 linguistic2::ProofreadingResult aTmpRes;
752 sal_Int32 nStartPos = nStartOfSentencePos >= 0 ? nStartOfSentencePos : 0;
754 bool bFound = false;
757 lang::Locale aCurLocale = lcl_GetPrimaryLanguageOfSentence( xFlatPara, nStartPos );
758 sal_Int32 nOldStartOfSentencePos = nStartPos;
759 uno::Reference< linguistic2::XProofreader > xGC;
760 OUString aDocId;
762 // ---- THREAD SAFE START ----
764 ::osl::ClearableGuard< ::osl::Mutex > aGuard( MyMutex::get() );
765 aDocId = GetOrCreateDocId( xComponent );
766 nSuggestedEndOfSentencePos = GetSuggestedEndOfSentence( rText, nStartPos, aCurLocale );
767 DBG_ASSERT( nSuggestedEndOfSentencePos > nStartPos, "nSuggestedEndOfSentencePos calculation failed?" );
769 xGC = GetGrammarChecker( aCurLocale );
771 // ---- THREAD SAFE START ----
772 sal_Int32 nEndPos = -1;
773 if (xGC.is())
775 uno::Sequence<beans::PropertyValue> const aProps(
776 lcl_makeProperties(xFlatPara, PROOFINFO_GET_PROOFRESULT));
777 aTmpRes = xGC->doProofreading( aDocId, rText,
778 aCurLocale, nStartPos, nSuggestedEndOfSentencePos, aProps );
780 //!! work-around to prevent looping if the grammar checker
781 //!! failed to properly identify the sentence end
782 if (aTmpRes.nBehindEndOfSentencePosition <= nStartPos)
784 SAL_WARN( "linguistic", "!! Grammarchecker failed to provide end of sentence !!" );
785 aTmpRes.nBehindEndOfSentencePosition = nSuggestedEndOfSentencePos;
788 aTmpRes.xFlatParagraph = xFlatPara;
789 aTmpRes.nStartOfSentencePosition = nStartPos;
790 nEndPos = aTmpRes.nBehindEndOfSentencePosition;
792 if ((nErrorPosInPara< 0 || nStartPos <= nErrorPosInPara) && nErrorPosInPara < nEndPos)
793 bFound = true;
795 if (nEndPos == -1) // no result from grammar checker
796 nEndPos = nSuggestedEndOfSentencePos;
797 nStartPos = lcl_SkipWhiteSpaces( rText, nEndPos );
798 aTmpRes.nBehindEndOfSentencePosition = nEndPos;
799 aTmpRes.nStartOfNextSentencePosition = nStartPos;
800 aTmpRes.nBehindEndOfSentencePosition = lcl_BacktraceWhiteSpaces( rText, aTmpRes.nStartOfNextSentencePosition );
802 // prevent endless loop by forcefully advancing if needs be...
803 if (nStartPos <= nOldStartOfSentencePos)
805 SAL_WARN( "linguistic", "end-of-sentence detection failed?" );
806 nStartPos = nOldStartOfSentencePos + 1;
809 while (!bFound && nStartPos < rText.getLength());
811 if (bFound && !xFlatPara->isModified())
812 aRes = aTmpRes;
815 return aRes;
819 sal_Int32 GrammarCheckingIterator::GetSuggestedEndOfSentence(
820 const OUString &rText,
821 sal_Int32 nSentenceStartPos,
822 const lang::Locale &rLocale )
824 // internal method; will always be called with locked mutex
826 if (!m_xBreakIterator.is())
828 uno::Reference< uno::XComponentContext > xContext = ::comphelper::getProcessComponentContext();
829 m_xBreakIterator = i18n::BreakIterator::create(xContext);
831 sal_Int32 nTextLen = rText.getLength();
832 sal_Int32 nEndPosition(0);
833 sal_Int32 nTmpStartPos = nSentenceStartPos;
836 sal_Int32 const nPrevEndPosition(nEndPosition);
837 nEndPosition = nTextLen;
838 if (nTmpStartPos < nTextLen)
840 nEndPosition = m_xBreakIterator->endOfSentence( rText, nTmpStartPos, rLocale );
841 if (nEndPosition <= nPrevEndPosition)
843 // fdo#68750 if there's no progress at all then presumably
844 // there's no end of sentence in this paragraph so just
845 // set the end position to end of paragraph
846 nEndPosition = nTextLen;
849 if (nEndPosition < 0)
850 nEndPosition = nTextLen;
852 ++nTmpStartPos;
854 while (nEndPosition <= nSentenceStartPos && nEndPosition < nTextLen);
855 if (nEndPosition > nTextLen)
856 nEndPosition = nTextLen;
857 return nEndPosition;
861 void SAL_CALL GrammarCheckingIterator::resetIgnoreRules( )
863 for (auto const& elem : m_aGCReferencesByService)
865 uno::Reference< linguistic2::XProofreader > xGC(elem.second);
866 if (xGC.is())
867 xGC->resetIgnoreRules();
872 sal_Bool SAL_CALL GrammarCheckingIterator::isProofreading(
873 const uno::Reference< uno::XInterface >& xDoc )
875 // ---- THREAD SAFE START ----
876 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
878 bool bRes = false;
880 uno::Reference< lang::XComponent > xComponent( xDoc, uno::UNO_QUERY );
881 if (xComponent.is())
883 // if the component was already used in one of the two calls to check text
884 // i.e. in startGrammarChecking or checkGrammarAtPos it will be found in the
885 // m_aDocIdMap unless the document already disposed.
886 // If it is not found then it is not yet being checked (or requested to being checked)
887 const DocMap_t::const_iterator aIt( m_aDocIdMap.find( xComponent.get() ) );
888 if (aIt != m_aDocIdMap.end())
890 // check in document is checked automatically in the background...
891 OUString aDocId = aIt->second;
892 if (!m_aCurCheckedDocId.isEmpty() && m_aCurCheckedDocId == aDocId)
894 // an entry for that document was dequeued and is currently being checked.
895 bRes = true;
897 else
899 // we need to check if there is an entry for that document in the queue...
900 // That is the document is going to be checked sooner or later.
902 sal_Int32 nSize = m_aFPEntriesQueue.size();
903 for (sal_Int32 i = 0; i < nSize && !bRes; ++i)
905 if (aDocId == m_aFPEntriesQueue[i].m_aDocId)
906 bRes = true;
911 // ---- THREAD SAFE END ----
913 return bRes;
917 void SAL_CALL GrammarCheckingIterator::processLinguServiceEvent(
918 const linguistic2::LinguServiceEvent& rLngSvcEvent )
920 if (rLngSvcEvent.nEvent != linguistic2::LinguServiceEventFlags::PROOFREAD_AGAIN)
921 return;
925 uno::Reference< uno::XInterface > xThis( static_cast< OWeakObject * >(this) );
926 linguistic2::LinguServiceEvent aEvent( xThis, linguistic2::LinguServiceEventFlags::PROOFREAD_AGAIN );
927 m_aNotifyListeners.notifyEach(
928 &linguistic2::XLinguServiceEventListener::processLinguServiceEvent,
929 aEvent);
931 catch (uno::RuntimeException &)
933 throw;
935 catch (const ::uno::Exception &)
937 // ignore
938 TOOLS_WARN_EXCEPTION("linguistic", "processLinguServiceEvent");
943 sal_Bool SAL_CALL GrammarCheckingIterator::addLinguServiceEventListener(
944 const uno::Reference< linguistic2::XLinguServiceEventListener >& xListener )
946 if (xListener.is())
948 m_aNotifyListeners.addInterface( xListener );
950 return true;
954 sal_Bool SAL_CALL GrammarCheckingIterator::removeLinguServiceEventListener(
955 const uno::Reference< linguistic2::XLinguServiceEventListener >& xListener )
957 if (xListener.is())
959 m_aNotifyListeners.removeInterface( xListener );
961 return true;
965 void SAL_CALL GrammarCheckingIterator::dispose()
967 lang::EventObject aEvt( static_cast<linguistic2::XProofreadingIterator *>(this) );
968 m_aEventListeners.disposeAndClear( aEvt );
970 TerminateThread();
972 // ---- THREAD SAFE START ----
974 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
976 // release all UNO references
978 m_xBreakIterator.clear();
980 // clear containers with UNO references AND have those references released
981 GCReferences_t aTmpEmpty1;
982 DocMap_t aTmpEmpty2;
983 FPQueue_t aTmpEmpty3;
984 m_aGCReferencesByService.swap( aTmpEmpty1 );
985 m_aDocIdMap.swap( aTmpEmpty2 );
986 m_aFPEntriesQueue.swap( aTmpEmpty3 );
988 // ---- THREAD SAFE END ----
992 void SAL_CALL GrammarCheckingIterator::addEventListener(
993 const uno::Reference< lang::XEventListener >& xListener )
995 if (xListener.is())
997 m_aEventListeners.addInterface( xListener );
1002 void SAL_CALL GrammarCheckingIterator::removeEventListener(
1003 const uno::Reference< lang::XEventListener >& xListener )
1005 if (xListener.is())
1007 m_aEventListeners.removeInterface( xListener );
1012 void SAL_CALL GrammarCheckingIterator::disposing( const lang::EventObject &rSource )
1014 // if the component (document) is disposing release all references
1015 //!! There is no need to remove entries from the queue that are from this document
1016 //!! since the respectives xFlatParagraphs should become invalid (isModified() == true)
1017 //!! and the call to xFlatParagraphIterator->getNextPara() will result in an empty reference.
1018 //!! And if an entry is currently checked by a grammar checker upon return the results
1019 //!! should be ignored.
1020 //!! Also GetOrCreateDocId will not use that very same Id again...
1021 //!! All of the above resulting in that we only have to get rid of the implementation pointer here.
1022 uno::Reference< lang::XComponent > xDoc( rSource.Source, uno::UNO_QUERY );
1023 if (xDoc.is())
1025 // ---- THREAD SAFE START ----
1026 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
1027 m_aDocIdMap.erase( xDoc.get() );
1028 // ---- THREAD SAFE END ----
1033 uno::Reference< util::XChangesBatch > const & GrammarCheckingIterator::GetUpdateAccess() const
1035 if (!m_xUpdateAccess.is())
1039 // get configuration provider
1040 uno::Reference< uno::XComponentContext > xContext = comphelper::getProcessComponentContext();
1041 uno::Reference< lang::XMultiServiceFactory > xConfigurationProvider =
1042 configuration::theDefaultProvider::get( xContext );
1044 // get configuration update access
1045 beans::PropertyValue aValue;
1046 aValue.Name = "nodepath";
1047 aValue.Value <<= OUString("org.openoffice.Office.Linguistic/ServiceManager");
1048 uno::Sequence< uno::Any > aProps(1);
1049 aProps[0] <<= aValue;
1050 m_xUpdateAccess.set(
1051 xConfigurationProvider->createInstanceWithArguments(
1052 "com.sun.star.configuration.ConfigurationUpdateAccess", aProps ),
1053 uno::UNO_QUERY_THROW );
1055 catch (uno::Exception &)
1060 return m_xUpdateAccess;
1064 void GrammarCheckingIterator::GetConfiguredGCSvcs_Impl()
1066 GCImplNames_t aTmpGCImplNamesByLang;
1070 // get node names (locale iso strings) for configured grammar checkers
1071 uno::Reference< container::XNameAccess > xNA( GetUpdateAccess(), uno::UNO_QUERY_THROW );
1072 xNA.set( xNA->getByName( "GrammarCheckerList" ), uno::UNO_QUERY_THROW );
1073 const uno::Sequence< OUString > aElementNames( xNA->getElementNames() );
1075 for (const OUString& rElementName : aElementNames)
1077 uno::Sequence< OUString > aImplNames;
1078 uno::Any aTmp( xNA->getByName( rElementName ) );
1079 if (aTmp >>= aImplNames)
1081 if (aImplNames.hasElements())
1083 // only the first entry is used, there should be only one grammar checker per language
1084 const OUString aImplName( aImplNames[0] );
1085 const LanguageType nLang = LanguageTag::convertToLanguageType( rElementName );
1086 aTmpGCImplNamesByLang[ nLang ] = aImplName;
1089 else
1091 SAL_WARN( "linguistic", "failed to get aImplNames. Wrong type?" );
1095 catch (uno::Exception const &)
1097 TOOLS_WARN_EXCEPTION( "linguistic", "exception caught. Failed to get configured services" );
1101 // ---- THREAD SAFE START ----
1102 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
1103 m_aGCImplNamesByLang = aTmpGCImplNamesByLang;
1104 // ---- THREAD SAFE END ----
1109 sal_Bool SAL_CALL GrammarCheckingIterator::supportsService(
1110 const OUString & rServiceName )
1112 return cppu::supportsService(this, rServiceName);
1116 OUString SAL_CALL GrammarCheckingIterator::getImplementationName( )
1118 return "com.sun.star.lingu2.ProofreadingIterator";
1122 uno::Sequence< OUString > SAL_CALL GrammarCheckingIterator::getSupportedServiceNames( )
1124 return { "com.sun.star.linguistic2.ProofreadingIterator" };
1128 void GrammarCheckingIterator::SetServiceList(
1129 const lang::Locale &rLocale,
1130 const uno::Sequence< OUString > &rSvcImplNames )
1132 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
1134 LanguageType nLanguage = LinguLocaleToLanguage( rLocale );
1135 OUString aImplName;
1136 if (rSvcImplNames.hasElements())
1137 aImplName = rSvcImplNames[0]; // there is only one grammar checker per language
1139 if (!LinguIsUnspecified(nLanguage) && nLanguage != LANGUAGE_DONTKNOW)
1141 if (!aImplName.isEmpty())
1142 m_aGCImplNamesByLang[ nLanguage ] = aImplName;
1143 else
1144 m_aGCImplNamesByLang.erase( nLanguage );
1149 uno::Sequence< OUString > GrammarCheckingIterator::GetServiceList(
1150 const lang::Locale &rLocale ) const
1152 ::osl::Guard< ::osl::Mutex > aGuard( MyMutex::get() );
1154 uno::Sequence< OUString > aRes(1);
1156 OUString aImplName; // there is only one grammar checker per language
1157 LanguageType nLang = LinguLocaleToLanguage( rLocale );
1158 GCImplNames_t::const_iterator aIt( m_aGCImplNamesByLang.find( nLang ) );
1159 if (aIt != m_aGCImplNamesByLang.end())
1160 aImplName = aIt->second;
1162 if (!aImplName.isEmpty())
1163 aRes[0] = aImplName;
1164 else
1165 aRes.realloc(0);
1167 return aRes;
1171 extern "C" SAL_DLLPUBLIC_EXPORT css::uno::XInterface*
1172 linguistic_GrammarCheckingIterator_get_implementation(
1173 css::uno::XComponentContext* , css::uno::Sequence<css::uno::Any> const&)
1175 return cppu::acquire(static_cast<cppu::OWeakObject*>(new GrammarCheckingIterator()));
1180 /* vim:set shiftwidth=4 softtabstop=4 expandtab: */