diff --git a/PdfForQtLib/sources/pdfexecutionpolicy.cpp b/PdfForQtLib/sources/pdfexecutionpolicy.cpp index f18b30d..67dc4f5 100644 --- a/PdfForQtLib/sources/pdfexecutionpolicy.cpp +++ b/PdfForQtLib/sources/pdfexecutionpolicy.cpp @@ -19,13 +19,26 @@ #include "pdfexecutionpolicy.h" #include +#include namespace pdf { struct PDFExecutionPolicyHolder { + PDFExecutionPolicyHolder() + { + qAddPostRoutine(&PDFExecutionPolicy::finalize); + } + ~PDFExecutionPolicyHolder() + { + auxiliary.waitForDone(); + primary.waitForDone(); + } + PDFExecutionPolicy policy; + QThreadPool primary; + QThreadPool auxiliary; } s_execution_policy; void PDFExecutionPolicy::setStrategy(Strategy strategy) @@ -50,13 +63,7 @@ bool PDFExecutionPolicy::isParallelizing(Scope scope) return true; // We are parallelizing pages... case Scope::Content: - { - // Jakub Melka: this is a bit complicated. We must count number of content streams - // being processed and if it is large enough, then do not parallelize. - const size_t threadLimit = s_execution_policy.policy.m_threadLimit.load(std::memory_order_relaxed); - const size_t contentStreamsCount = s_execution_policy.policy.m_contentStreamsCount.load(std::memory_order_seq_cst); - return contentStreamsCount < threadLimit; - } + return false; } break; @@ -71,6 +78,34 @@ bool PDFExecutionPolicy::isParallelizing(Scope scope) return false; } +int PDFExecutionPolicy::getActiveThreadCount(Scope scope) +{ + return getThreadPool(scope)->activeThreadCount(); +} + +int PDFExecutionPolicy::getMaxThreadCount(Scope scope) +{ + return getThreadPool(scope)->maxThreadCount(); +} + +void PDFExecutionPolicy::setMaxThreadCount(Scope scope, int count) +{ + // Sanitize value! + count = qMax(count, 1); + getThreadPool(scope)->setMaxThreadCount(count); +} + +int PDFExecutionPolicy::getIdealThreadCount(Scope scope) +{ + Q_UNUSED(scope); + return QThread::idealThreadCount(); +} + +int PDFExecutionPolicy::getContentStreamCount() +{ + return s_execution_policy.policy.m_contentStreamsCount.load(std::memory_order_relaxed); +} + void PDFExecutionPolicy::startProcessingContentStream() { ++s_execution_policy.policy.m_contentStreamsCount; @@ -81,9 +116,33 @@ void PDFExecutionPolicy::endProcessingContentStream() --s_execution_policy.policy.m_contentStreamsCount; } +void PDFExecutionPolicy::finalize() +{ + s_execution_policy.auxiliary.waitForDone(); + s_execution_policy.primary.waitForDone(); +} + +QThreadPool* PDFExecutionPolicy::getThreadPool(PDFExecutionPolicy::Scope scope) +{ + switch (scope) + { + case Scope::Page: + case Scope::Unknown: + return &s_execution_policy.primary; + + case Scope::Content: + return &s_execution_policy.auxiliary; + + default: + Q_ASSERT(false); + break; + } + + return nullptr; +} + PDFExecutionPolicy::PDFExecutionPolicy() : m_contentStreamsCount(0), - m_threadLimit(QThread::idealThreadCount()), m_strategy(Strategy::PageMultithreaded) { diff --git a/PdfForQtLib/sources/pdfexecutionpolicy.h b/PdfForQtLib/sources/pdfexecutionpolicy.h index 1f43c63..7d14544 100644 --- a/PdfForQtLib/sources/pdfexecutionpolicy.h +++ b/PdfForQtLib/sources/pdfexecutionpolicy.h @@ -20,6 +20,9 @@ #include "pdfglobal.h" +#include +#include + #include #include @@ -53,15 +56,48 @@ public: static void setStrategy(Strategy strategy); /// Determines, if we should parallelize for scope - /// \param scope Scope for which we want to determine exectution policy + /// \param scope Scope for which we want to determine execution policy static bool isParallelizing(Scope scope); + template + class Runnable : public QRunnable + { + public: + explicit inline Runnable(ForwardIt it, UnaryFunction* function, QSemaphore* semaphore) : + m_forwardIt(qMove(it)), + m_function(function), + m_semaphore(semaphore) + { + setAutoDelete(true); + } + + virtual void run() override + { + QSemaphoreReleaser semaphoreReleaser(m_semaphore); + (*m_function)(*m_forwardIt); + } + + private: + ForwardIt m_forwardIt; + UnaryFunction* m_function; + QSemaphore* m_semaphore; + }; + template static void execute(Scope scope, ForwardIt first, ForwardIt last, UnaryFunction f) { if (isParallelizing(scope)) { - std::for_each(std::execution::parallel_policy(), first, last, f); + QSemaphore semaphore(0); + int count = static_cast(std::distance(first, last)); + + QThreadPool* pool = getThreadPool(scope); + for (auto it = first; it != last; ++it) + { + pool->start(new Runnable(it, &f, &semaphore)); + } + + semaphore.acquire(count); } else { @@ -72,29 +108,45 @@ public: template static void sort(Scope scope, ForwardIt first, ForwardIt last, Comparator f) { - if (isParallelizing(scope)) - { - std::sort(std::execution::parallel_policy(), first, last, f); - } - else - { - std::sort(std::execution::sequenced_policy(), first, last, f); - } + Q_UNUSED(scope); + + // We always sort by single thread + std::sort(std::execution::sequenced_policy(), first, last, f); } + /// Returns number of active threads for given scope + static int getActiveThreadCount(Scope scope); + + /// Returns maximal number of threads for given scope + static int getMaxThreadCount(Scope scope); + + /// Sets maximal number of threads for given scope + static void setMaxThreadCount(Scope scope, int count); + + /// Returns ideal thread count for given scope + static int getIdealThreadCount(Scope scope); + + /// Returns number of currently processed content streams + static int getContentStreamCount(); + /// Starts processing content stream static void startProcessingContentStream(); /// Ends processing content stream static void endProcessingContentStream(); + /// Finalize multithreading - must be called at the end of program + static void finalize(); + private: friend struct PDFExecutionPolicyHolder; + /// Returns thread pool based on scope + static QThreadPool* getThreadPool(Scope scope); + explicit PDFExecutionPolicy(); - std::atomic m_contentStreamsCount; - std::atomic m_threadLimit; + std::atomic m_contentStreamsCount; std::atomic m_strategy; }; diff --git a/PdfForQtViewer/pdfviewersettings.cpp b/PdfForQtViewer/pdfviewersettings.cpp index d3ffc0c..ee65fed 100644 --- a/PdfForQtViewer/pdfviewersettings.cpp +++ b/PdfForQtViewer/pdfviewersettings.cpp @@ -253,7 +253,7 @@ PDFViewerSettings::Settings::Settings() : m_thumbnailsCacheLimit(PIXMAP_CACHE_LIMIT), m_fontCacheLimit(pdf::DEFAULT_FONT_CACHE_LIMIT), m_instancedFontCacheLimit(pdf::DEFAULT_REALIZED_FONT_CACHE_LIMIT), - m_multithreadingStrategy(pdf::PDFExecutionPolicy::Strategy::PageMultithreaded), + m_multithreadingStrategy(pdf::PDFExecutionPolicy::Strategy::AlwaysMultithreaded), m_speechRate(0.0), m_speechPitch(0.0), m_speechVolume(1.0), diff --git a/PdfForQtViewer/pdfviewersettings.h b/PdfForQtViewer/pdfviewersettings.h index 869bd54..0c96484 100644 --- a/PdfForQtViewer/pdfviewersettings.h +++ b/PdfForQtViewer/pdfviewersettings.h @@ -57,7 +57,7 @@ public: pdf::PDFReal m_colorTolerance; bool m_allowLaunchApplications; bool m_allowLaunchURI; - pdf::PDFExecutionPolicy::Strategy m_multithreadingStrategy = pdf::PDFExecutionPolicy::Strategy::PageMultithreaded; + pdf::PDFExecutionPolicy::Strategy m_multithreadingStrategy; // Cache settings int m_compiledPageCacheLimit; diff --git a/PdfForQtViewer/pdfviewersettingsdialog.ui b/PdfForQtViewer/pdfviewersettingsdialog.ui index 5f9cf2f..2dfc9e1 100644 --- a/PdfForQtViewer/pdfviewersettingsdialog.ui +++ b/PdfForQtViewer/pdfviewersettingsdialog.ui @@ -26,7 +26,7 @@ - 10 + 0 @@ -113,7 +113,7 @@ - <html><head/><body><p>Select rendering method according to your needs. <span style=" font-weight:600;">Software rendering</span> is much slower than hardware accelerated rendering using <span style=" font-weight:600;">OpenGL rendering</span>, but it works when OpenGL is not available at your platform. OpenGL rendering is selected as default and is recommended.</p><p>OpenGL rendering uses<span style=" font-weight:600;"> multisample antialiasing (MSAA)</span>, which provides good quality antialiasing. You can turn this feature on or off, but without antialiasing, bad quality image can occur. Samples count affect how much samples per pixel are considered to determine pixel color. It can be a value 1, 2, 4, 8, and 16. Most modern GPUs support at least value 8. Lower this value, if your GPU doesn't support the desired sample count.</p><p><span style=" font-weight:600;">Prefetch pages </span>prefetches (pre-renders) pages next to currently viewed pages, to avoid flickering during scrolling. Prefetched pages are stored in the page cache.</p><p><span style=" font-weight:600;">Multithreading strategy </span>defines how program will use CPU cores. Engine can use multiple cores. Strategy defines, how engine will use these cores. <span style=" font-weight:600;">Single thread</span> strategy uses only one CPU core for rendering page, and for some operations, they aren't parallelized, at the cost of more time needed for operation to be finished. But still, each page will use its own thread to be compiled/drawn. On the other side, there are two multithreading strategies, former is load balanced, latter uses maximum threads. Load balanced strategy tries to optimize number of threads to fit CPU cores, while maximum threads strategy will spawn as much threads as possible to process operations, which can be sometimes unoptimal.</p></body></html> + <html><head/><body><p>Select rendering method according to your needs. <span style=" font-weight:600;">Software rendering</span> is much slower than hardware accelerated rendering using <span style=" font-weight:600;">OpenGL rendering</span>, but it works when OpenGL is not available at your platform. OpenGL rendering is selected as default and is recommended.</p><p>OpenGL rendering uses<span style=" font-weight:600;"> multisample antialiasing (MSAA)</span>, which provides good quality antialiasing. You can turn this feature on or off, but without antialiasing, bad quality image can occur. Samples count affect how much samples per pixel are considered to determine pixel color. It can be a value 1, 2, 4, 8, and 16. Most modern GPUs support at least value 8. Lower this value, if your GPU doesn't support the desired sample count.</p><p><span style=" font-weight:600;">Prefetch pages </span>prefetches (pre-renders) pages next to currently viewed pages, to avoid flickering during scrolling. Prefetched pages are stored in the page cache.</p><p><span style=" font-weight:600;">Multithreading strategy </span>defines how program will use CPU cores. Engine can use multiple cores. Strategy defines, how engine will use these cores. <span style=" font-weight:600;">Single thread</span> strategy uses only one CPU core for rendering page, and for some operations, they aren't parallelized, at the cost of more time needed for operation to be finished. But still, each page will use its own thread to be compiled/drawn. On the other side, there are two multithreading strategies, former is load balanced, latter uses maximum threads. Load balanced strategy parallelizes only pages, but not processing each individual page content, while maximum threads strategy will spawn as much threads as possible to process operations to achieve best performance.</p></body></html> true