mirror of
https://github.com/JakubMelka/PDF4QT.git
synced 2025-01-28 08:09:28 +01:00
595 lines
18 KiB
C++
595 lines
18 KiB
C++
// Copyright (C) 2019-2022 Jakub Melka
|
|
//
|
|
// This file is part of PDF4QT.
|
|
//
|
|
// PDF4QT is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU Lesser General Public License as published by
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
// with the written consent of the copyright owner, any later version.
|
|
//
|
|
// PDF4QT is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU Lesser General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Lesser General Public License
|
|
// along with PDF4QT. If not, see <https://www.gnu.org/licenses/>.
|
|
|
|
#include "pdfcompiler.h"
|
|
#include "pdfcms.h"
|
|
#include "pdfprogress.h"
|
|
#include "pdfexecutionpolicy.h"
|
|
#include "pdftextlayoutgenerator.h"
|
|
#include "pdfdrawspacecontroller.h"
|
|
|
|
#include <QCache>
|
|
#include <QtConcurrent/QtConcurrent>
|
|
|
|
#include "pdfdbgheap.h"
|
|
|
|
#include <execution>
|
|
|
|
namespace pdf
|
|
{
|
|
|
|
PDFAsynchronousPageCompilerWorkerThread::PDFAsynchronousPageCompilerWorkerThread(PDFAsynchronousPageCompiler* parent) :
|
|
QThread(parent),
|
|
m_compiler(parent),
|
|
m_mutex(&m_compiler->m_mutex),
|
|
m_waitCondition(&m_compiler->m_waitCondition)
|
|
{
|
|
|
|
}
|
|
|
|
void PDFAsynchronousPageCompilerWorkerThread::run()
|
|
{
|
|
QMutexLocker locker(m_mutex);
|
|
while (!isInterruptionRequested())
|
|
{
|
|
if (m_waitCondition->wait(locker.mutex(), QDeadlineTimer(QDeadlineTimer::Forever)))
|
|
{
|
|
while (!isInterruptionRequested())
|
|
{
|
|
std::vector<PDFAsynchronousPageCompiler::CompileTask> tasks;
|
|
for (auto& task : m_compiler->m_tasks)
|
|
{
|
|
if (!task.second.finished)
|
|
{
|
|
tasks.push_back(task.second);
|
|
}
|
|
}
|
|
|
|
if (!tasks.empty())
|
|
{
|
|
locker.unlock();
|
|
|
|
// Perform page compilation
|
|
auto proxy = m_compiler->getProxy();
|
|
proxy->getFontCache()->setCacheShrinkEnabled(this, false);
|
|
|
|
auto compilePage = [this, proxy](PDFAsynchronousPageCompiler::CompileTask& task) -> PDFPrecompiledPage
|
|
{
|
|
PDFPrecompiledPage compiledPage;
|
|
PDFCMSPointer cms = proxy->getCMSManager()->getCurrentCMS();
|
|
PDFRenderer renderer(proxy->getDocument(), proxy->getFontCache(), cms.data(), proxy->getOptionalContentActivity(), proxy->getFeatures(), proxy->getMeshQualitySettings());
|
|
renderer.setOperationControl(m_compiler);
|
|
renderer.compile(&task.precompiledPage, task.pageIndex);
|
|
task.finished = true;
|
|
return compiledPage;
|
|
};
|
|
PDFExecutionPolicy::execute(PDFExecutionPolicy::Scope::Page, tasks.begin(), tasks.end(), compilePage);
|
|
|
|
proxy->getFontCache()->setCacheShrinkEnabled(this, true);
|
|
|
|
// Relock the mutex to write the tasks
|
|
locker.relock();
|
|
|
|
// Now, write compiled pages
|
|
bool isSomethingWritten = false;
|
|
for (auto& task : tasks)
|
|
{
|
|
if (task.finished)
|
|
{
|
|
isSomethingWritten = true;
|
|
m_compiler->m_tasks[task.pageIndex] = std::move(task);
|
|
}
|
|
}
|
|
|
|
if (isSomethingWritten)
|
|
{
|
|
// Why we are unlocking the mutex? Because
|
|
// we do not want to emit signals with locked mutexes.
|
|
// If direct connection is applied, this can lead to deadlock.
|
|
locker.unlock();
|
|
Q_EMIT pageCompiled();
|
|
locker.relock();
|
|
}
|
|
}
|
|
else
|
|
{
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
PDFAsynchronousPageCompiler::PDFAsynchronousPageCompiler(PDFDrawWidgetProxy* proxy) :
|
|
BaseClass(proxy),
|
|
m_proxy(proxy),
|
|
m_cache(new QCache<PDFInteger, PDFPrecompiledPage>())
|
|
{
|
|
m_cache->setMaxCost(128 * 1024 * 1024);
|
|
}
|
|
|
|
PDFAsynchronousPageCompiler::~PDFAsynchronousPageCompiler()
|
|
{
|
|
stop(true);
|
|
|
|
delete m_cache;
|
|
m_cache = nullptr;
|
|
}
|
|
|
|
bool PDFAsynchronousPageCompiler::isOperationCancelled() const
|
|
{
|
|
return m_state == State::Stopping;
|
|
}
|
|
|
|
void PDFAsynchronousPageCompiler::start()
|
|
{
|
|
switch (m_state)
|
|
{
|
|
case State::Inactive:
|
|
{
|
|
Q_ASSERT(!m_thread);
|
|
m_state = State::Active;
|
|
m_thread = new PDFAsynchronousPageCompilerWorkerThread(this);
|
|
connect(m_thread, &PDFAsynchronousPageCompilerWorkerThread::pageCompiled, this, &PDFAsynchronousPageCompiler::onPageCompiled);
|
|
m_thread->start();
|
|
break;
|
|
}
|
|
|
|
case State::Active:
|
|
break; // We have nothing to do...
|
|
|
|
case State::Stopping:
|
|
{
|
|
// We shouldn't call this function while stopping!
|
|
Q_ASSERT(false);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
void PDFAsynchronousPageCompiler::stop(bool clearCache)
|
|
{
|
|
switch (m_state)
|
|
{
|
|
case State::Inactive:
|
|
{
|
|
Q_ASSERT(!m_thread);
|
|
break; // We have nothing to do...
|
|
}
|
|
|
|
case State::Active:
|
|
{
|
|
// Stop the engine
|
|
m_state = State::Stopping;
|
|
|
|
Q_ASSERT(m_thread);
|
|
m_thread->requestInterruption();
|
|
m_waitCondition.wakeAll();
|
|
m_thread->wait();
|
|
delete m_thread;
|
|
m_thread = nullptr;
|
|
|
|
// It is safe to do not use mutex, because
|
|
// we have ended the work thread.
|
|
m_tasks.clear();
|
|
|
|
if (clearCache)
|
|
{
|
|
m_cache->clear();
|
|
}
|
|
|
|
m_state = State::Inactive;
|
|
break;
|
|
}
|
|
|
|
case State::Stopping:
|
|
{
|
|
// We shouldn't call this function while stopping!
|
|
Q_ASSERT(false);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
void PDFAsynchronousPageCompiler::reset()
|
|
{
|
|
stop(true);
|
|
start();
|
|
}
|
|
|
|
void PDFAsynchronousPageCompiler::setCacheLimit(int limit)
|
|
{
|
|
m_cache->setMaxCost(limit);
|
|
}
|
|
|
|
const PDFPrecompiledPage* PDFAsynchronousPageCompiler::getCompiledPage(PDFInteger pageIndex, bool compile)
|
|
{
|
|
if (m_state != State::Active || !m_proxy->getDocument())
|
|
{
|
|
// Engine is not active, always return nullptr
|
|
return nullptr;
|
|
}
|
|
|
|
PDFPrecompiledPage* page = m_cache->object(pageIndex);
|
|
|
|
if (!page && compile)
|
|
{
|
|
QMutexLocker locker(&m_mutex);
|
|
if (!m_tasks.count(pageIndex))
|
|
{
|
|
m_tasks.insert(std::make_pair(pageIndex, CompileTask(pageIndex)));
|
|
m_waitCondition.wakeOne();
|
|
}
|
|
}
|
|
|
|
if (page)
|
|
{
|
|
page->markAccessed();
|
|
}
|
|
|
|
return page;
|
|
}
|
|
|
|
void PDFAsynchronousPageCompiler::smartClearCache(const int milisecondsLimit, const std::vector<PDFInteger>& activePages)
|
|
{
|
|
if (m_state != State::Active)
|
|
{
|
|
// Jakub Melka: Cache clearing can be done only in active state
|
|
return;
|
|
}
|
|
|
|
QMutexLocker locker(&m_mutex);
|
|
|
|
Q_ASSERT(std::is_sorted(activePages.cbegin(), activePages.cend()));
|
|
|
|
QList<PDFInteger> pageIndices = m_cache->keys();
|
|
for (const PDFInteger pageIndex : pageIndices)
|
|
{
|
|
if (std::binary_search(activePages.cbegin(), activePages.cend(), pageIndex))
|
|
{
|
|
// We do not remove active page
|
|
continue;
|
|
}
|
|
|
|
const PDFPrecompiledPage* page = m_cache->object(pageIndex);
|
|
if (page && page->hasExpired(milisecondsLimit))
|
|
{
|
|
m_cache->remove(pageIndex);
|
|
}
|
|
}
|
|
}
|
|
|
|
void PDFAsynchronousPageCompiler::onPageCompiled()
|
|
{
|
|
std::vector<PDFInteger> compiledPages;
|
|
std::map<PDFInteger, PDFRenderError> errors;
|
|
|
|
{
|
|
QMutexLocker locker(&m_mutex);
|
|
|
|
// Search all tasks for finished tasks
|
|
for (auto it = m_tasks.begin(); it != m_tasks.end();)
|
|
{
|
|
CompileTask& task = it->second;
|
|
if (task.finished)
|
|
{
|
|
if (m_state == State::Active)
|
|
{
|
|
// If we are in active state, try to store precompiled page
|
|
PDFPrecompiledPage* page = new PDFPrecompiledPage(std::move(task.precompiledPage));
|
|
page->markAccessed();
|
|
qint64 memoryConsumptionEstimate = page->getMemoryConsumptionEstimate();
|
|
if (m_cache->insert(it->first, page, memoryConsumptionEstimate))
|
|
{
|
|
compiledPages.push_back(it->first);
|
|
}
|
|
else
|
|
{
|
|
// We can't insert page to the cache, because cache size is too small. We will
|
|
// emit error string to inform the user, that cache is too small.
|
|
QString message = PDFTranslationContext::tr("Precompiled page size is too high (%1 kB). Cache size is %2 kB. Increase the cache size!").arg(memoryConsumptionEstimate / 1024).arg(m_cache->maxCost() / 1024);
|
|
errors[it->first] = PDFRenderError(RenderErrorType::Error, message);
|
|
}
|
|
}
|
|
|
|
it = m_tasks.erase(it);
|
|
}
|
|
else
|
|
{
|
|
// Just increment the counter
|
|
++it;
|
|
}
|
|
}
|
|
}
|
|
|
|
for (const auto& error : errors)
|
|
{
|
|
Q_EMIT renderingError(error.first, { error.second });
|
|
}
|
|
|
|
if (!compiledPages.empty())
|
|
{
|
|
Q_ASSERT(std::is_sorted(compiledPages.cbegin(), compiledPages.cend()));
|
|
Q_EMIT pageImageChanged(false, compiledPages);
|
|
}
|
|
}
|
|
|
|
PDFAsynchronousTextLayoutCompiler::PDFAsynchronousTextLayoutCompiler(PDFDrawWidgetProxy* proxy) :
|
|
BaseClass(proxy),
|
|
m_proxy(proxy),
|
|
m_isRunning(false),
|
|
m_cache(std::bind(&PDFAsynchronousTextLayoutCompiler::createTextLayout, this, std::placeholders::_1))
|
|
{
|
|
connect(&m_textLayoutCompileFutureWatcher, &QFutureWatcher<PDFTextLayoutStorage>::finished, this, &PDFAsynchronousTextLayoutCompiler::onTextLayoutCreated);
|
|
}
|
|
|
|
void PDFAsynchronousTextLayoutCompiler::start()
|
|
{
|
|
switch (m_state)
|
|
{
|
|
case State::Inactive:
|
|
{
|
|
m_state = State::Active;
|
|
break;
|
|
}
|
|
|
|
case State::Active:
|
|
break; // We have nothing to do...
|
|
|
|
case State::Stopping:
|
|
{
|
|
// We shouldn't call this function while stopping!
|
|
Q_ASSERT(false);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
void PDFAsynchronousTextLayoutCompiler::stop(bool clearCache)
|
|
{
|
|
switch (m_state)
|
|
{
|
|
case State::Inactive:
|
|
break; // We have nothing to do...
|
|
|
|
case State::Active:
|
|
{
|
|
// Stop the engine
|
|
m_state = State::Stopping;
|
|
m_textLayoutCompileFutureWatcher.waitForFinished();
|
|
|
|
if (clearCache)
|
|
{
|
|
m_textLayouts = std::nullopt;
|
|
m_cache.clear();
|
|
}
|
|
|
|
m_state = State::Inactive;
|
|
break;
|
|
}
|
|
|
|
case State::Stopping:
|
|
{
|
|
// We shouldn't call this function while stopping!
|
|
Q_ASSERT(false);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
void PDFAsynchronousTextLayoutCompiler::reset()
|
|
{
|
|
stop(true);
|
|
start();
|
|
}
|
|
|
|
PDFTextLayout PDFAsynchronousTextLayoutCompiler::createTextLayout(PDFInteger pageIndex)
|
|
{
|
|
PDFTextLayout result;
|
|
|
|
if (isTextLayoutReady())
|
|
{
|
|
result = getTextLayout(pageIndex);
|
|
}
|
|
else
|
|
{
|
|
if (m_state != State::Active || !m_proxy->getDocument())
|
|
{
|
|
// Engine is not active, do not calculate layout
|
|
return result;
|
|
}
|
|
|
|
const PDFCatalog* catalog = m_proxy->getDocument()->getCatalog();
|
|
if (pageIndex < 0 || pageIndex >= PDFInteger(catalog->getPageCount()))
|
|
{
|
|
return result;
|
|
}
|
|
|
|
if (!catalog->getPage(pageIndex))
|
|
{
|
|
// Invalid page index
|
|
return result;
|
|
}
|
|
|
|
const PDFPage* page = catalog->getPage(pageIndex);
|
|
Q_ASSERT(page);
|
|
|
|
bool guard = false;
|
|
m_proxy->getFontCache()->setCacheShrinkEnabled(&guard, false);
|
|
|
|
PDFCMSPointer cms = m_proxy->getCMSManager()->getCurrentCMS();
|
|
PDFTextLayoutGenerator generator(m_proxy->getFeatures(), page, m_proxy->getDocument(), m_proxy->getFontCache(), cms.data(), m_proxy->getOptionalContentActivity(), QTransform(), m_proxy->getMeshQualitySettings());
|
|
generator.processContents();
|
|
result = generator.createTextLayout();
|
|
m_proxy->getFontCache()->setCacheShrinkEnabled(&guard, true);
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
PDFTextLayout PDFAsynchronousTextLayoutCompiler::getTextLayout(PDFInteger pageIndex)
|
|
{
|
|
if (m_state != State::Active || !m_proxy->getDocument())
|
|
{
|
|
// Engine is not active, always return empty layout
|
|
return PDFTextLayout();
|
|
}
|
|
|
|
if (m_textLayouts)
|
|
{
|
|
return m_textLayouts->getTextLayout(pageIndex);
|
|
}
|
|
|
|
return PDFTextLayout();
|
|
}
|
|
|
|
PDFTextLayoutGetter PDFAsynchronousTextLayoutCompiler::getTextLayoutLazy(PDFInteger pageIndex)
|
|
{
|
|
return PDFTextLayoutGetter(&m_cache, pageIndex);
|
|
}
|
|
|
|
PDFTextSelection PDFAsynchronousTextLayoutCompiler::getTextSelectionAll(QColor color) const
|
|
{
|
|
PDFTextSelection result;
|
|
|
|
if (m_textLayouts)
|
|
{
|
|
const PDFTextLayoutStorage& textLayouts = *m_textLayouts;
|
|
|
|
QMutex mutex;
|
|
PDFIntegerRange<size_t> pageRange(0, textLayouts.getCount());
|
|
auto selectPageText = [&mutex, &textLayouts, &result, color](PDFInteger pageIndex)
|
|
{
|
|
PDFTextLayout textLayout = textLayouts.getTextLayout(pageIndex);
|
|
PDFTextSelectionItems items;
|
|
|
|
const PDFTextBlocks& blocks = textLayout.getTextBlocks();
|
|
for (size_t blockId = 0, blockCount = blocks.size(); blockId < blockCount; ++blockId)
|
|
{
|
|
const PDFTextBlock& block = blocks[blockId];
|
|
const PDFTextLines& lines = block.getLines();
|
|
|
|
if (!lines.empty())
|
|
{
|
|
const PDFTextLine& lastLine = lines.back();
|
|
Q_ASSERT(!lastLine.getCharacters().empty());
|
|
|
|
PDFCharacterPointer ptrStart;
|
|
ptrStart.pageIndex = pageIndex;
|
|
ptrStart.blockIndex = blockId;
|
|
ptrStart.lineIndex = 0;
|
|
ptrStart.characterIndex = 0;
|
|
|
|
PDFCharacterPointer ptrEnd;
|
|
ptrEnd.pageIndex = pageIndex;
|
|
ptrEnd.blockIndex = blockId;
|
|
ptrEnd.lineIndex = lines.size() - 1;
|
|
ptrEnd.characterIndex = lastLine.getCharacters().size() - 1;
|
|
|
|
items.emplace_back(ptrStart, ptrEnd);
|
|
}
|
|
}
|
|
|
|
QMutexLocker lock(&mutex);
|
|
result.addItems(qMove(items), color);
|
|
};
|
|
PDFExecutionPolicy::execute(PDFExecutionPolicy::Scope::Page, pageRange.begin(), pageRange.end(), selectPageText);
|
|
}
|
|
|
|
result.build();
|
|
return result;
|
|
}
|
|
|
|
void PDFAsynchronousTextLayoutCompiler::makeTextLayout()
|
|
{
|
|
if (m_state != State::Active || !m_proxy->getDocument())
|
|
{
|
|
// Engine is not active, do not calculate layout
|
|
return;
|
|
}
|
|
|
|
if (m_textLayouts.has_value())
|
|
{
|
|
// Value is computed already
|
|
return;
|
|
}
|
|
|
|
if (m_isRunning)
|
|
{
|
|
// Text layout is already being processed
|
|
return;
|
|
}
|
|
|
|
// Jakub Melka: Mark, that we are running (test for future is not enough,
|
|
// because future can finish before this function exits, for example)
|
|
m_isRunning = true;
|
|
|
|
ProgressStartupInfo info;
|
|
info.showDialog = false;
|
|
info.text = tr("Indexing document contents...");
|
|
|
|
m_proxy->getFontCache()->setCacheShrinkEnabled(this, false);
|
|
const PDFCatalog* catalog = m_proxy->getDocument()->getCatalog();
|
|
m_proxy->getProgress()->start(catalog->getPageCount(), qMove(info));
|
|
|
|
PDFCMSPointer cms = m_proxy->getCMSManager()->getCurrentCMS();
|
|
|
|
auto createTextLayout = [this, cms, catalog]() -> PDFTextLayoutStorage
|
|
{
|
|
PDFTextLayoutStorage result(catalog->getPageCount());
|
|
QMutex mutex;
|
|
auto generateTextLayout = [this, &result, &mutex, cms, catalog](PDFInteger pageIndex)
|
|
{
|
|
if (!catalog->getPage(pageIndex))
|
|
{
|
|
// Invalid page index
|
|
result.setTextLayout(pageIndex, PDFTextLayout(), &mutex);
|
|
return;
|
|
}
|
|
|
|
const PDFPage* page = catalog->getPage(pageIndex);
|
|
Q_ASSERT(page);
|
|
|
|
PDFTextLayoutGenerator generator(m_proxy->getFeatures(), page, m_proxy->getDocument(), m_proxy->getFontCache(), cms.data(), m_proxy->getOptionalContentActivity(), QTransform(), m_proxy->getMeshQualitySettings());
|
|
generator.processContents();
|
|
result.setTextLayout(pageIndex, generator.createTextLayout(), &mutex);
|
|
m_proxy->getProgress()->step();
|
|
};
|
|
|
|
auto pageRange = PDFIntegerRange<PDFInteger>(0, catalog->getPageCount());
|
|
PDFExecutionPolicy::execute(PDFExecutionPolicy::Scope::Page, pageRange.begin(), pageRange.end(), generateTextLayout);
|
|
return result;
|
|
};
|
|
|
|
Q_ASSERT(!m_textLayoutCompileFuture.isRunning());
|
|
m_textLayoutCompileFuture = QtConcurrent::run(createTextLayout);
|
|
m_textLayoutCompileFutureWatcher.setFuture(m_textLayoutCompileFuture);
|
|
}
|
|
|
|
void PDFAsynchronousTextLayoutCompiler::onTextLayoutCreated()
|
|
{
|
|
m_proxy->getFontCache()->setCacheShrinkEnabled(this, true);
|
|
m_proxy->getProgress()->finish();
|
|
m_cache.clear();
|
|
|
|
m_textLayouts = m_textLayoutCompileFuture.result();
|
|
m_isRunning = false;
|
|
Q_EMIT textLayoutChanged();
|
|
}
|
|
|
|
} // namespace pdf
|