mirror of https://github.com/JakubMelka/PDF4QT.git
283 lines
8.6 KiB
C++
283 lines
8.6 KiB
C++
// Copyright (C) 2018-2023 Jakub Melka
|
|
//
|
|
// This file is part of PDF4QT.
|
|
//
|
|
// PDF4QT is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU Lesser General Public License as published by
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
// with the written consent of the copyright owner, any later version.
|
|
//
|
|
// PDF4QT is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU Lesser General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Lesser General Public License
|
|
// along with PDF4QT. If not, see <https://www.gnu.org/licenses/>.
|
|
|
|
|
|
#include "pdfvisitor.h"
|
|
#include "pdfdbgheap.h"
|
|
|
|
namespace pdf
|
|
{
|
|
|
|
void PDFAbstractVisitor::acceptArray(const PDFArray* array)
|
|
{
|
|
Q_ASSERT(array);
|
|
|
|
for (size_t i = 0, count = array->getCount(); i < count; ++i)
|
|
{
|
|
array->getItem(i).accept(this);
|
|
}
|
|
}
|
|
|
|
void PDFAbstractVisitor::acceptDictionary(const PDFDictionary* dictionary)
|
|
{
|
|
Q_ASSERT(dictionary);
|
|
|
|
for (size_t i = 0, count = dictionary->getCount(); i < count; ++i)
|
|
{
|
|
dictionary->getValue(i).accept(this);
|
|
}
|
|
}
|
|
|
|
void PDFAbstractVisitor::acceptStream(const PDFStream* stream)
|
|
{
|
|
Q_ASSERT(stream);
|
|
|
|
acceptDictionary(stream->getDictionary());
|
|
}
|
|
|
|
PDFStatisticsCollector::PDFStatisticsCollector()
|
|
{
|
|
|
|
}
|
|
|
|
void PDFStatisticsCollector::visitNull()
|
|
{
|
|
collectStatisticsOfSimpleObject(PDFObject::Type::Null);
|
|
}
|
|
|
|
void PDFStatisticsCollector::visitBool(bool value)
|
|
{
|
|
Q_UNUSED(value);
|
|
collectStatisticsOfSimpleObject(PDFObject::Type::Bool);
|
|
}
|
|
|
|
void PDFStatisticsCollector::visitInt(PDFInteger value)
|
|
{
|
|
Q_UNUSED(value);
|
|
collectStatisticsOfSimpleObject(PDFObject::Type::Int);
|
|
}
|
|
|
|
void PDFStatisticsCollector::visitReal(PDFReal value)
|
|
{
|
|
Q_UNUSED(value);
|
|
collectStatisticsOfSimpleObject(PDFObject::Type::Real);
|
|
}
|
|
|
|
void PDFStatisticsCollector::visitString(PDFStringRef string)
|
|
{
|
|
Statistics& statistics = m_statistics[size_t(PDFObject::Type::String)];
|
|
if (string.inplaceString)
|
|
{
|
|
collectStatisticsOfSimpleObject(PDFObject::Type::String);
|
|
}
|
|
else
|
|
{
|
|
collectStatisticsOfString(string.memoryString, statistics);
|
|
}
|
|
}
|
|
|
|
void PDFStatisticsCollector::visitName(PDFStringRef name)
|
|
{
|
|
Statistics& statistics = m_statistics[size_t(PDFObject::Type::Name)];
|
|
if (name.inplaceString)
|
|
{
|
|
collectStatisticsOfSimpleObject(PDFObject::Type::Name);
|
|
}
|
|
else
|
|
{
|
|
collectStatisticsOfString(name.memoryString, statistics);
|
|
}
|
|
}
|
|
|
|
void PDFStatisticsCollector::visitArray(const PDFArray* array)
|
|
{
|
|
Statistics& statistics = m_statistics[size_t(PDFObject::Type::Array)];
|
|
statistics.count += 1;
|
|
statistics.memoryConsumptionEstimate += sizeof(PDFObject) + sizeof(PDFArray);
|
|
|
|
// We process elements of the array, together with memory consumption,
|
|
// in the call of acceptArray function. No need to calculate memory consumption here.
|
|
// Just calculate the overhead.
|
|
statistics.memoryOverheadEstimate += (array->getCapacity() - array->getCount()) * sizeof(PDFObject);
|
|
|
|
acceptArray(array);
|
|
}
|
|
|
|
void PDFStatisticsCollector::visitDictionary(const PDFDictionary* dictionary)
|
|
{
|
|
Statistics& statistics = m_statistics[size_t(PDFObject::Type::Dictionary)];
|
|
collectStatisticsOfDictionary(statistics, dictionary);
|
|
|
|
acceptDictionary(dictionary);
|
|
}
|
|
|
|
void PDFStatisticsCollector::visitStream(const PDFStream* stream)
|
|
{
|
|
Statistics& statistics = m_statistics[size_t(PDFObject::Type::Stream)];
|
|
collectStatisticsOfDictionary(statistics, stream->getDictionary());
|
|
|
|
const QByteArray& byteArray = *stream->getContent();
|
|
const uint64_t memoryConsumption = byteArray.size() * sizeof(char);
|
|
const uint64_t memoryOverhead = (byteArray.capacity() - byteArray.size()) * sizeof(char);
|
|
|
|
statistics.memoryConsumptionEstimate += memoryConsumption;
|
|
statistics.memoryOverheadEstimate += memoryOverhead;
|
|
|
|
acceptStream(stream);
|
|
}
|
|
|
|
void PDFStatisticsCollector::visitReference(const PDFObjectReference reference)
|
|
{
|
|
Q_UNUSED(reference);
|
|
collectStatisticsOfSimpleObject(PDFObject::Type::Reference);
|
|
}
|
|
|
|
void PDFStatisticsCollector::collectStatisticsOfDictionary(Statistics& statistics, const PDFDictionary* dictionary)
|
|
{
|
|
statistics.count += 1;
|
|
statistics.memoryConsumptionEstimate += sizeof(PDFObject) + sizeof(PDFDictionary);
|
|
|
|
constexpr uint64_t sizeOfItem = sizeof(std::pair<QByteArray, PDFObject>);
|
|
constexpr uint64_t sizeOfItemWithoutObject = sizeOfItem - sizeof(PDFObject);
|
|
|
|
uint64_t consumptionEstimate = sizeOfItemWithoutObject * dictionary->getCount();
|
|
uint64_t overheadEstimate = sizeOfItem * (dictionary->getCapacity() - dictionary->getCount());
|
|
|
|
for (size_t i = 0, count = dictionary->getCount(); i < count; ++i)
|
|
{
|
|
if (!dictionary->getKey(i).isInplace())
|
|
{
|
|
QByteArray key = dictionary->getKey(i).getString();
|
|
|
|
consumptionEstimate += key.size() * sizeof(char);
|
|
overheadEstimate += (key.capacity() - key.size()) * sizeof(char);
|
|
}
|
|
}
|
|
|
|
statistics.memoryConsumptionEstimate += consumptionEstimate;
|
|
statistics.memoryOverheadEstimate += overheadEstimate;
|
|
}
|
|
|
|
void PDFStatisticsCollector::collectStatisticsOfString(const PDFString* string, Statistics& statistics)
|
|
{
|
|
statistics.count += 1;
|
|
statistics.memoryConsumptionEstimate += sizeof(PDFObject) + sizeof(PDFString);
|
|
|
|
const QByteArray& byteArray = string->getString();
|
|
const uint64_t memoryConsumption = byteArray.size() * sizeof(char);
|
|
const uint64_t memoryOverhead = (byteArray.capacity() - byteArray.size()) * sizeof(char);
|
|
|
|
statistics.memoryConsumptionEstimate += memoryConsumption;
|
|
statistics.memoryOverheadEstimate += memoryOverhead;
|
|
}
|
|
|
|
void PDFStatisticsCollector::collectStatisticsOfSimpleObject(PDFObject::Type type)
|
|
{
|
|
Statistics& statistics = m_statistics[size_t(type)];
|
|
statistics.count += 1;
|
|
statistics.memoryConsumptionEstimate += sizeof(PDFObject);
|
|
}
|
|
|
|
void PDFUpdateObjectVisitor::visitNull()
|
|
{
|
|
m_objectStack.push_back(PDFObject::createNull());
|
|
}
|
|
|
|
void PDFUpdateObjectVisitor::visitBool(bool value)
|
|
{
|
|
m_objectStack.push_back(PDFObject::createBool(value));
|
|
}
|
|
|
|
void PDFUpdateObjectVisitor::visitInt(PDFInteger value)
|
|
{
|
|
m_objectStack.push_back(PDFObject::createInteger(value));
|
|
}
|
|
|
|
void PDFUpdateObjectVisitor::visitReal(PDFReal value)
|
|
{
|
|
m_objectStack.push_back(PDFObject::createReal(value));
|
|
}
|
|
|
|
void PDFUpdateObjectVisitor::visitString(PDFStringRef string)
|
|
{
|
|
m_objectStack.push_back(PDFObject::createString(string));
|
|
}
|
|
|
|
void PDFUpdateObjectVisitor::visitName(PDFStringRef name)
|
|
{
|
|
m_objectStack.push_back(PDFObject::createName(name));
|
|
}
|
|
|
|
void PDFUpdateObjectVisitor::visitArray(const PDFArray* array)
|
|
{
|
|
acceptArray(array);
|
|
|
|
// We have all objects on the stack
|
|
Q_ASSERT(array->getCount() <= m_objectStack.size());
|
|
|
|
auto it = std::next(m_objectStack.cbegin(), m_objectStack.size() - array->getCount());
|
|
std::vector<PDFObject> objects(it, m_objectStack.cend());
|
|
PDFObject object = PDFObject::createArray(std::make_shared<PDFArray>(qMove(objects)));
|
|
m_objectStack.erase(it, m_objectStack.cend());
|
|
m_objectStack.push_back(object);
|
|
}
|
|
|
|
void PDFUpdateObjectVisitor::visitDictionary(const PDFDictionary* dictionary)
|
|
{
|
|
Q_ASSERT(dictionary);
|
|
|
|
std::vector<PDFDictionary::DictionaryEntry> entries;
|
|
entries.reserve(dictionary->getCount());
|
|
|
|
for (size_t i = 0, count = dictionary->getCount(); i < count; ++i)
|
|
{
|
|
dictionary->getValue(i).accept(this);
|
|
Q_ASSERT(!m_objectStack.empty());
|
|
entries.emplace_back(dictionary->getKey(i), m_objectStack.back());
|
|
m_objectStack.pop_back();
|
|
}
|
|
|
|
m_objectStack.push_back(PDFObject::createDictionary(std::make_shared<PDFDictionary>(qMove(entries))));
|
|
}
|
|
|
|
void PDFUpdateObjectVisitor::visitStream(const PDFStream* stream)
|
|
{
|
|
const PDFDictionary* dictionary = stream->getDictionary();
|
|
|
|
visitDictionary(dictionary);
|
|
|
|
Q_ASSERT(!m_objectStack.empty());
|
|
PDFObject dictionaryObject = m_objectStack.back();
|
|
m_objectStack.pop_back();
|
|
|
|
PDFDictionary newDictionary(*dictionaryObject.getDictionary());
|
|
m_objectStack.push_back(PDFObject::createStream(std::make_shared<PDFStream>(qMove(newDictionary), QByteArray(*stream->getContent()))));
|
|
}
|
|
|
|
void PDFUpdateObjectVisitor::visitReference(const PDFObjectReference reference)
|
|
{
|
|
m_objectStack.push_back(PDFObject::createReference(reference));
|
|
}
|
|
|
|
PDFObject PDFUpdateObjectVisitor::getObject()
|
|
{
|
|
Q_ASSERT(m_objectStack.size() == 1);
|
|
return qMove(m_objectStack.back());
|
|
}
|
|
|
|
} // namespace pdf
|