2020-01-18 11:38:54 +01:00
|
|
|
// Copyright (C) 2019-2020 Jakub Melka
|
2019-03-25 18:44:45 +01:00
|
|
|
//
|
2020-12-20 19:03:58 +01:00
|
|
|
// This file is part of Pdf4Qt.
|
2019-03-25 18:44:45 +01:00
|
|
|
//
|
2020-12-20 19:03:58 +01:00
|
|
|
// Pdf4Qt is free software: you can redistribute it and/or modify
|
2019-03-25 18:44:45 +01:00
|
|
|
// it under the terms of the GNU Lesser General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
2020-12-20 19:03:58 +01:00
|
|
|
// Pdf4Qt is distributed in the hope that it will be useful,
|
2019-03-25 18:44:45 +01:00
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU Lesser General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Lesser General Public License
|
2020-12-20 19:03:58 +01:00
|
|
|
// along with Pdf4Qt. If not, see <https://www.gnu.org/licenses/>.
|
2019-03-25 18:44:45 +01:00
|
|
|
|
|
|
|
#ifndef PDFFONT_H
|
|
|
|
#define PDFFONT_H
|
|
|
|
|
|
|
|
#include "pdfglobal.h"
|
2019-03-30 18:45:30 +01:00
|
|
|
#include "pdfencoding.h"
|
|
|
|
#include "pdfobject.h"
|
2019-03-25 18:44:45 +01:00
|
|
|
|
2019-04-16 19:59:10 +02:00
|
|
|
#include <QFont>
|
2019-07-14 19:03:15 +02:00
|
|
|
#include <QMatrix>
|
2019-03-25 18:44:45 +01:00
|
|
|
#include <QSharedPointer>
|
|
|
|
|
2020-01-01 18:23:18 +01:00
|
|
|
#include <set>
|
2019-04-30 18:38:27 +02:00
|
|
|
#include <unordered_map>
|
|
|
|
|
2019-04-16 19:59:10 +02:00
|
|
|
class QPainterPath;
|
2020-10-24 14:39:09 +02:00
|
|
|
class QTreeWidgetItem;
|
2019-04-16 19:59:10 +02:00
|
|
|
|
2019-03-25 18:44:45 +01:00
|
|
|
namespace pdf
|
|
|
|
{
|
2019-03-30 18:45:30 +01:00
|
|
|
class PDFDocument;
|
2020-04-25 14:21:06 +02:00
|
|
|
class PDFModifiedDocument;
|
2019-04-30 14:39:48 +02:00
|
|
|
class PDFRenderErrorReporter;
|
2020-10-24 14:39:09 +02:00
|
|
|
class PDFFontCMap;
|
2019-03-25 18:44:45 +01:00
|
|
|
|
2019-04-27 14:14:07 +02:00
|
|
|
/// Character identifier (CID)
using CID = unsigned int;

/// Glyph identifier (GID)
using GID = unsigned int;

/// Fixed table of 256 glyph identifiers.
/// NOTE(review): presumably indexed by the single-byte character code of a simple font - confirm.
using GlyphIndices = std::array<GID, 256>;
|
2019-04-19 17:42:58 +02:00
|
|
|
|
2019-03-25 18:44:45 +01:00
|
|
|
/// Text rendering mode. The numeric values are assigned explicitly (0-7), so the
/// enumerators can be converted to and from integer mode codes. Which operations
/// (fill / stroke / clip) each mode implies is answered by isTextRenderingModeFilled,
/// isTextRenderingModeStroked and isTextRenderingModeClipped.
enum class TextRenderingMode
{
    Fill = 0,           ///< Filled only
    Stroke = 1,         ///< Stroked only
    FillStroke = 2,     ///< Filled and stroked
    Invisible = 3,      ///< Neither filled, stroked, nor clipped
    FillClip = 4,       ///< Filled and clipped
    StrokeClip = 5,     ///< Stroked and clipped
    FillStrokeClip = 6, ///< Filled, stroked and clipped
    Clip = 7            ///< Clipped only
};
|
|
|
|
|
2019-04-07 19:39:29 +02:00
|
|
|
/// Item of the text sequence (either single character, or advance)
|
|
|
|
struct TextSequenceItem
|
|
|
|
{
|
|
|
|
inline explicit TextSequenceItem() = default;
|
|
|
|
inline explicit TextSequenceItem(const QPainterPath* glyph, QChar character, PDFReal advance) : glyph(glyph), character(character), advance(advance) { }
|
|
|
|
inline explicit TextSequenceItem(PDFReal advance) : character(), advance(advance) { }
|
2020-08-21 16:37:57 +02:00
|
|
|
inline explicit TextSequenceItem(const QByteArray* characterContentStream, QChar character, PDFReal advance) : characterContentStream(characterContentStream), character(character), advance(advance) { }
|
2019-04-07 19:39:29 +02:00
|
|
|
|
2019-07-14 19:03:15 +02:00
|
|
|
inline bool isContentStream() const { return characterContentStream; }
|
2019-04-27 14:14:07 +02:00
|
|
|
inline bool isCharacter() const { return glyph; }
|
2019-04-07 19:39:29 +02:00
|
|
|
inline bool isAdvance() const { return advance != 0.0; }
|
|
|
|
inline bool isNull() const { return !isCharacter() && !isAdvance(); }
|
|
|
|
|
|
|
|
const QPainterPath* glyph = nullptr;
|
2019-07-14 19:03:15 +02:00
|
|
|
const QByteArray* characterContentStream = nullptr;
|
2019-04-07 19:39:29 +02:00
|
|
|
QChar character;
|
|
|
|
PDFReal advance = 0;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct TextSequence
|
|
|
|
{
|
|
|
|
std::vector<TextSequenceItem> items;
|
|
|
|
};
|
|
|
|
|
2019-03-25 18:44:45 +01:00
|
|
|
/// Returns true, if the given text rendering mode includes filling
/// \param mode Text rendering mode
constexpr bool isTextRenderingModeFilled(TextRenderingMode mode)
{
    return mode == TextRenderingMode::Fill ||
           mode == TextRenderingMode::FillClip ||
           mode == TextRenderingMode::FillStroke ||
           mode == TextRenderingMode::FillStrokeClip;
}
|
|
|
|
|
|
|
|
/// Returns true, if the given text rendering mode includes stroking
/// \param mode Text rendering mode
constexpr bool isTextRenderingModeStroked(TextRenderingMode mode)
{
    return mode == TextRenderingMode::Stroke ||
           mode == TextRenderingMode::FillStroke ||
           mode == TextRenderingMode::StrokeClip ||
           mode == TextRenderingMode::FillStrokeClip;
}
|
|
|
|
|
|
|
|
/// Returns true, if the given text rendering mode includes clipping
/// \param mode Text rendering mode
constexpr bool isTextRenderingModeClipped(TextRenderingMode mode)
{
    return mode == TextRenderingMode::Clip ||
           mode == TextRenderingMode::FillClip ||
           mode == TextRenderingMode::StrokeClip ||
           mode == TextRenderingMode::FillStrokeClip;
}
|
|
|
|
|
2019-03-30 18:45:30 +01:00
|
|
|
/// Type of the font, as reported by PDFFont::getFontType
enum class FontType
{
    Invalid,
    Type0,
    Type1,
    MMType1,
    TrueType,
    Type3
};
|
|
|
|
|
|
|
|
/// Standard Type1 fonts. Invalid means, that the font is not one of the standard fonts.
enum class StandardFontType
{
    Invalid,
    TimesRoman,
    TimesRomanBold,
    TimesRomanItalics,
    TimesRomanBoldItalics,
    Helvetica,
    HelveticaBold,
    HelveticaOblique,
    HelveticaBoldOblique,
    Courier,
    CourierBold,
    CourierOblique,
    CourierBoldOblique,
    Symbol,
    ZapfDingbats
};
|
|
|
|
|
|
|
|
/// Returns builtin encoding for the standard font
|
|
|
|
static constexpr PDFEncoding::Encoding getEncodingForStandardFont(StandardFontType standardFont)
|
|
|
|
{
|
|
|
|
switch (standardFont)
|
|
|
|
{
|
|
|
|
case StandardFontType::Symbol:
|
|
|
|
return PDFEncoding::Encoding::Symbol;
|
|
|
|
|
|
|
|
case StandardFontType::ZapfDingbats:
|
|
|
|
return PDFEncoding::Encoding::ZapfDingbats;
|
|
|
|
|
|
|
|
default:
|
|
|
|
return PDFEncoding::Encoding::Standard;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-12-20 19:03:58 +01:00
|
|
|
struct Pdf4QtLIBSHARED_EXPORT FontDescriptor
|
2019-03-31 18:08:36 +02:00
|
|
|
{
|
|
|
|
bool isEmbedded() const { return !fontFile.isEmpty() || !fontFile2.isEmpty() || !fontFile3.isEmpty(); }
|
|
|
|
|
2019-04-16 19:59:10 +02:00
|
|
|
/// Returns embedded font data, or nullptr, if font is not embedded
|
|
|
|
const QByteArray* getEmbeddedFontData() const;
|
|
|
|
|
2019-03-31 18:08:36 +02:00
|
|
|
QByteArray fontName;
|
|
|
|
QByteArray fontFamily;
|
|
|
|
QFont::Stretch fontStretch = QFont::AnyStretch;
|
|
|
|
PDFReal fontWeight = 400.0;
|
|
|
|
PDFInteger flags;
|
|
|
|
QRectF boundingBox;
|
|
|
|
PDFReal italicAngle = 0.0;
|
|
|
|
PDFReal ascent = 0.0;
|
|
|
|
PDFReal descent = 0.0;
|
|
|
|
PDFReal leading = 0.0;
|
|
|
|
PDFReal capHeight = 0.0;
|
|
|
|
PDFReal xHeight = 0.0;
|
|
|
|
PDFReal stemV = 0.0;
|
|
|
|
PDFReal stemH = 0.0;
|
|
|
|
PDFReal avgWidth = 0.0;
|
|
|
|
PDFReal maxWidth = 0.0;
|
|
|
|
PDFReal missingWidth = 0.0;
|
|
|
|
|
|
|
|
/// Byte array with Type 1 font program (embedded font)
|
|
|
|
QByteArray fontFile;
|
|
|
|
|
|
|
|
/// Byte array with TrueType font program (embedded font)
|
|
|
|
QByteArray fontFile2;
|
|
|
|
|
|
|
|
/// Byte array with font program, whose format is defined by the Subtype array
|
|
|
|
/// in the font dictionary.
|
|
|
|
QByteArray fontFile3;
|
|
|
|
|
|
|
|
/// Character set
|
|
|
|
QByteArray charset;
|
|
|
|
};
|
|
|
|
|
2019-03-30 18:45:30 +01:00
|
|
|
class PDFFont;
|
|
|
|
|
|
|
|
using PDFFontPointer = QSharedPointer<PDFFont>;
|
|
|
|
|
2019-04-07 19:39:29 +02:00
|
|
|
class PDFRealizedFont;
|
2019-07-14 19:03:15 +02:00
|
|
|
class IRealizedFontImpl;
|
2019-04-07 19:39:29 +02:00
|
|
|
|
|
|
|
using PDFRealizedFontPointer = QSharedPointer<PDFRealizedFont>;
|
|
|
|
|
2020-10-25 13:51:57 +01:00
|
|
|
struct CharacterInfo
|
|
|
|
{
|
|
|
|
GID gid = 0;
|
|
|
|
QChar character;
|
|
|
|
};
|
|
|
|
using CharacterInfos = std::vector<CharacterInfo>;
|
|
|
|
|
2019-04-07 19:39:29 +02:00
|
|
|
/// Font, which has fixed pixel size. It is programmed as PIMPL, because we need
|
|
|
|
/// to remove FreeType types from the interface (so we do not include FreeType in the interface).
|
2020-12-20 19:03:58 +01:00
|
|
|
class Pdf4QtLIBSHARED_EXPORT PDFRealizedFont
|
2019-04-07 19:39:29 +02:00
|
|
|
{
|
|
|
|
public:
|
|
|
|
~PDFRealizedFont();
|
|
|
|
|
|
|
|
/// Fills the text sequence by interpreting byte array according font data and
|
|
|
|
/// produces glyphs for the font.
|
|
|
|
/// \param byteArray Array of bytes to be interpreted
|
|
|
|
/// \param textSequence Text sequence to be filled
|
2019-04-30 14:39:48 +02:00
|
|
|
/// \param reporter Error reporter
|
|
|
|
void fillTextSequence(const QByteArray& byteArray, TextSequence& textSequence, PDFRenderErrorReporter* reporter);
|
2019-04-07 19:39:29 +02:00
|
|
|
|
|
|
|
/// Return true, if we have horizontal writing system
|
|
|
|
bool isHorizontalWritingSystem() const;
|
|
|
|
|
2019-12-21 18:10:54 +01:00
|
|
|
/// Adds information about the font into tree item
|
|
|
|
void dumpFontToTreeItem(QTreeWidgetItem* item) const;
|
|
|
|
|
2020-10-24 15:36:00 +02:00
|
|
|
/// Returns postscript name of the font
|
|
|
|
QString getPostScriptName() const;
|
|
|
|
|
2020-10-25 13:51:57 +01:00
|
|
|
/// Returns character info
|
|
|
|
CharacterInfos getCharacterInfos() const;
|
|
|
|
|
2019-04-07 19:39:29 +02:00
|
|
|
/// Creates new realized font from the standard font. If font can't be created,
|
|
|
|
/// then exception is thrown.
|
2019-10-02 19:37:19 +02:00
|
|
|
static PDFRealizedFontPointer createRealizedFont(PDFFontPointer font, PDFReal pixelSize, PDFRenderErrorReporter* reporter);
|
2019-04-07 19:39:29 +02:00
|
|
|
|
|
|
|
private:
|
|
|
|
/// Constructs new realized font
|
2019-07-14 19:03:15 +02:00
|
|
|
explicit PDFRealizedFont(IRealizedFontImpl* impl) : m_impl(impl) { }
|
2019-04-07 19:39:29 +02:00
|
|
|
|
2019-07-14 19:03:15 +02:00
|
|
|
IRealizedFontImpl* m_impl;
|
2019-04-07 19:39:29 +02:00
|
|
|
};
|
|
|
|
|
2019-03-30 18:45:30 +01:00
|
|
|
/// Base class representing font in the PDF file
|
2020-12-20 19:03:58 +01:00
|
|
|
class Pdf4QtLIBSHARED_EXPORT PDFFont
|
2019-03-25 18:44:45 +01:00
|
|
|
{
|
|
|
|
public:
|
2019-03-31 18:08:36 +02:00
|
|
|
explicit PDFFont(FontDescriptor fontDescriptor);
|
2019-03-30 18:45:30 +01:00
|
|
|
virtual ~PDFFont() = default;
|
|
|
|
|
|
|
|
/// Returns the font type
|
|
|
|
virtual FontType getFontType() const = 0;
|
|
|
|
|
2020-10-24 14:39:09 +02:00
|
|
|
/// Returns ToUnicode mapping (or nullptr, if font has no mapping to unicode)
|
|
|
|
virtual const PDFFontCMap* getToUnicode() const { return nullptr; }
|
|
|
|
|
2019-03-31 18:08:36 +02:00
|
|
|
/// Returns font descriptor
|
|
|
|
const FontDescriptor* getFontDescriptor() const { return &m_fontDescriptor; }
|
|
|
|
|
2019-12-21 18:10:54 +01:00
|
|
|
/// Adds information about the font into tree item
|
|
|
|
virtual void dumpFontToTreeItem(QTreeWidgetItem* item) const { Q_UNUSED(item); }
|
|
|
|
|
2019-03-31 18:08:36 +02:00
|
|
|
/// Creates font from the object. If font can't be created, exception is thrown.
|
|
|
|
/// \param object Font dictionary
|
|
|
|
/// \param document Document
|
2019-03-30 18:45:30 +01:00
|
|
|
static PDFFontPointer createFont(const PDFObject& object, const PDFDocument* document);
|
2019-03-31 18:08:36 +02:00
|
|
|
|
|
|
|
protected:
|
|
|
|
FontDescriptor m_fontDescriptor;
|
2019-04-27 14:14:07 +02:00
|
|
|
|
|
|
|
private:
|
|
|
|
/// Tries to read font descriptor from the object
|
|
|
|
/// \param fontDescriptorObject Font descriptor dictionary
|
|
|
|
/// \param document Document
|
|
|
|
static FontDescriptor readFontDescriptor(const PDFObject& fontDescriptorObject, const PDFDocument* document);
|
2019-03-25 18:44:45 +01:00
|
|
|
};
|
|
|
|
|
2019-03-30 18:45:30 +01:00
|
|
|
/// Simple font, see PDF reference 1.7, chapter 5.5. Simple fonts have encoding table,
|
|
|
|
/// which maps single-byte character to the glyph in the font.
|
|
|
|
class PDFSimpleFont : public PDFFont
|
|
|
|
{
|
2019-12-21 18:10:54 +01:00
|
|
|
using BaseClass = PDFFont;
|
|
|
|
|
2019-03-30 18:45:30 +01:00
|
|
|
public:
|
2019-03-31 18:08:36 +02:00
|
|
|
explicit PDFSimpleFont(FontDescriptor fontDescriptor,
|
|
|
|
QByteArray name,
|
2019-03-30 18:45:30 +01:00
|
|
|
QByteArray baseFont,
|
|
|
|
PDFInteger firstChar,
|
|
|
|
PDFInteger lastChar,
|
|
|
|
std::vector<PDFInteger> widths,
|
|
|
|
PDFEncoding::Encoding encodingType,
|
2019-04-19 17:42:58 +02:00
|
|
|
encoding::EncodingTable encoding,
|
|
|
|
GlyphIndices glyphIndices);
|
2019-03-30 18:45:30 +01:00
|
|
|
virtual ~PDFSimpleFont() override = default;
|
|
|
|
|
2020-10-24 14:39:09 +02:00
|
|
|
const PDFEncoding::Encoding getEncodingType() const { return m_encodingType; }
|
2019-04-19 17:42:58 +02:00
|
|
|
const encoding::EncodingTable* getEncoding() const { return &m_encoding; }
|
|
|
|
const GlyphIndices* getGlyphIndices() const { return &m_glyphIndices; }
|
|
|
|
|
2019-04-30 18:38:27 +02:00
|
|
|
/// Returns the glyph advance (or zero, if glyph advance is invalid)
|
|
|
|
PDFInteger getGlyphAdvance(size_t index) const;
|
2019-04-30 14:39:48 +02:00
|
|
|
|
2019-12-21 18:10:54 +01:00
|
|
|
virtual void dumpFontToTreeItem(QTreeWidgetItem* item) const override;
|
|
|
|
|
2019-03-30 18:45:30 +01:00
|
|
|
protected:
|
|
|
|
QByteArray m_name;
|
|
|
|
QByteArray m_baseFont;
|
|
|
|
PDFInteger m_firstChar;
|
|
|
|
PDFInteger m_lastChar;
|
|
|
|
std::vector<PDFInteger> m_widths;
|
|
|
|
PDFEncoding::Encoding m_encodingType;
|
|
|
|
encoding::EncodingTable m_encoding;
|
2019-04-19 17:42:58 +02:00
|
|
|
GlyphIndices m_glyphIndices;
|
2019-03-30 18:45:30 +01:00
|
|
|
};
|
|
|
|
|
|
|
|
class PDFType1Font : public PDFSimpleFont
|
|
|
|
{
|
2019-12-21 18:10:54 +01:00
|
|
|
using BaseClass = PDFSimpleFont;
|
|
|
|
|
2019-03-30 18:45:30 +01:00
|
|
|
public:
|
2020-08-18 19:39:09 +02:00
|
|
|
explicit PDFType1Font(FontType fontType,
|
|
|
|
FontDescriptor fontDescriptor,
|
2019-03-31 18:08:36 +02:00
|
|
|
QByteArray name,
|
2019-03-30 18:45:30 +01:00
|
|
|
QByteArray baseFont,
|
|
|
|
PDFInteger firstChar,
|
|
|
|
PDFInteger lastChar,
|
|
|
|
std::vector<PDFInteger> widths,
|
|
|
|
PDFEncoding::Encoding encodingType,
|
|
|
|
encoding::EncodingTable encoding,
|
2019-04-19 17:42:58 +02:00
|
|
|
StandardFontType standardFontType,
|
|
|
|
GlyphIndices glyphIndices);
|
2019-03-30 18:45:30 +01:00
|
|
|
virtual ~PDFType1Font() override = default;
|
|
|
|
|
|
|
|
virtual FontType getFontType() const override;
|
2019-12-21 18:10:54 +01:00
|
|
|
virtual void dumpFontToTreeItem(QTreeWidgetItem*item) const override;
|
2019-03-30 18:45:30 +01:00
|
|
|
|
|
|
|
/// Returns the assigned standard font (or invalid, if font is not standard)
|
|
|
|
StandardFontType getStandardFontType() const { return m_standardFontType; }
|
|
|
|
|
|
|
|
private:
|
2020-08-18 19:39:09 +02:00
|
|
|
FontType m_fontType;
|
2019-03-30 18:45:30 +01:00
|
|
|
StandardFontType m_standardFontType; ///< Type of the standard font (or invalid, if it is not a standard font)
|
|
|
|
};
|
|
|
|
|
|
|
|
class PDFTrueTypeFont : public PDFSimpleFont
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
using PDFSimpleFont::PDFSimpleFont;
|
|
|
|
|
|
|
|
virtual FontType getFontType() const override;
|
|
|
|
};
|
2019-03-25 18:44:45 +01:00
|
|
|
|
2019-04-12 19:17:19 +02:00
|
|
|
/// Font cache which caches both fonts, and realized fonts. Cache has individual limit
|
|
|
|
/// for fonts, and realized fonts.
|
2020-12-20 19:03:58 +01:00
|
|
|
class Pdf4QtLIBSHARED_EXPORT PDFFontCache
|
2019-04-12 19:17:19 +02:00
|
|
|
{
|
|
|
|
public:
|
|
|
|
inline explicit PDFFontCache(size_t fontCacheLimit, size_t realizedFontCacheLimit) :
|
|
|
|
m_fontCacheLimit(fontCacheLimit),
|
|
|
|
m_realizedFontCacheLimit(realizedFontCacheLimit),
|
|
|
|
m_document(nullptr)
|
|
|
|
{
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2020-04-25 14:21:06 +02:00
|
|
|
/// Sets the document to the cache. Whole cache is cleared,
|
|
|
|
/// if it is needed.
|
2019-04-12 19:17:19 +02:00
|
|
|
/// \param document Document to be setted
|
2020-04-25 14:21:06 +02:00
|
|
|
void setDocument(const PDFModifiedDocument& document);
|
2019-04-12 19:17:19 +02:00
|
|
|
|
|
|
|
/// Retrieves font from the cache. If font can't be accessed or created,
|
|
|
|
/// then exception is thrown.
|
|
|
|
/// \param fontObject Font object
|
|
|
|
PDFFontPointer getFont(const PDFObject& fontObject) const;
|
|
|
|
|
|
|
|
/// Retrieves realized font from the cache. If realized font can't be accessed or created,
|
|
|
|
/// then exception is thrown.
|
|
|
|
/// \param font Font, which should be realized
|
|
|
|
/// \param size Size of the font (in pixels)
|
2019-10-02 19:37:19 +02:00
|
|
|
/// \param reporter Error reporter
|
|
|
|
PDFRealizedFontPointer getRealizedFont(const PDFFontPointer& font, PDFReal size, PDFRenderErrorReporter* reporter) const;
|
2019-04-12 19:17:19 +02:00
|
|
|
|
2019-12-15 19:28:25 +01:00
|
|
|
/// Sets or unsets font shrinking (i.e. font can be deleted from the cache). In multithreading environment,
|
|
|
|
/// font deletion is not thread safe. For this reason, disable font deletion by calling this function.
|
2020-01-01 18:23:18 +01:00
|
|
|
/// First parameter, \p source determines which object enables cache shrinking (so some objects can
|
|
|
|
/// enable shrinking, while some objects will disable it). Only if all objects enables cache shrinking,
|
|
|
|
/// then cache can shrink.
|
|
|
|
/// \param source Source object
|
|
|
|
/// \param enabled Enable or disable cache shrinking
|
2020-03-07 17:38:50 +01:00
|
|
|
void setCacheShrinkEnabled(const void* source, bool enabled);
|
2019-12-15 19:28:25 +01:00
|
|
|
|
|
|
|
/// Set font cache limits
|
|
|
|
void setCacheLimits(int fontCacheLimit, int instancedFontCacheLimit);
|
|
|
|
|
|
|
|
/// If shrinking is enabled, then erase font, if cache limit is exceeded.
|
|
|
|
void shrink();
|
|
|
|
|
2019-04-12 19:17:19 +02:00
|
|
|
private:
|
2019-12-15 19:28:25 +01:00
|
|
|
size_t m_fontCacheLimit;
|
|
|
|
size_t m_realizedFontCacheLimit;
|
2019-04-12 19:17:19 +02:00
|
|
|
mutable QMutex m_mutex;
|
|
|
|
const PDFDocument* m_document;
|
|
|
|
mutable std::map<PDFObjectReference, PDFFontPointer> m_fontCache;
|
|
|
|
mutable std::map<std::pair<PDFFontPointer, PDFReal>, PDFRealizedFontPointer> m_realizedFontCache;
|
2020-03-07 17:38:50 +01:00
|
|
|
mutable std::set<const void*> m_fontCacheShrinkDisabledObjects;
|
2019-04-12 19:17:19 +02:00
|
|
|
};
|
|
|
|
|
2019-04-27 14:14:07 +02:00
|
|
|
/// Performs mapping from CID to GID (even identity mapping, if byte array is empty)
|
|
|
|
class PDFCIDtoGIDMapper
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
explicit inline PDFCIDtoGIDMapper(QByteArray&& mapping) : m_mapping(qMove(mapping)) { }
|
|
|
|
|
|
|
|
/// Maps CID to GID (glyph identifier)
|
|
|
|
GID map(CID cid) const
|
|
|
|
{
|
|
|
|
if (m_mapping.isEmpty())
|
|
|
|
{
|
|
|
|
// This means identity mapping
|
|
|
|
return cid;
|
|
|
|
}
|
|
|
|
else if ((2 * cid + 1) < CID(m_mapping.size()))
|
|
|
|
{
|
|
|
|
return (GID(m_mapping[2 * cid]) << 8) + GID(m_mapping[2 * cid + 1]);
|
|
|
|
}
|
|
|
|
|
|
|
|
// This should occur only in case of bad (damaged) PDF file - because in this case,
|
|
|
|
// encoding is missing. Return invalid glyph index.
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2020-10-25 13:51:57 +01:00
|
|
|
/// Maps GID to CID (inverse mapping)
|
|
|
|
CID unmap(GID gid) const
|
|
|
|
{
|
|
|
|
if (m_mapping.isEmpty())
|
|
|
|
{
|
|
|
|
// This means identity mapping
|
|
|
|
return gid;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
CID lastCid = CID(m_mapping.size() / 2);
|
|
|
|
for (CID i = 0; i < lastCid; ++i)
|
|
|
|
{
|
|
|
|
if (map(i) == gid)
|
|
|
|
{
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// This should occur only in case of bad (damaged) PDF file - because in this case,
|
|
|
|
// encoding is missing. Return invalid character index.
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2019-04-27 14:14:07 +02:00
|
|
|
private:
|
|
|
|
QByteArray m_mapping;
|
|
|
|
};
|
|
|
|
|
|
|
|
/// Represents a font CMAP (mapping of CIDs)
|
2020-12-20 19:03:58 +01:00
|
|
|
class Pdf4QtLIBSHARED_EXPORT PDFFontCMap
|
2019-04-27 14:14:07 +02:00
|
|
|
{
|
|
|
|
public:
|
2021-03-06 18:13:21 +01:00
|
|
|
explicit PDFFontCMap() = default;
|
2019-04-27 14:14:07 +02:00
|
|
|
|
|
|
|
/// Returns true, if mapping is valid
|
|
|
|
bool isValid() const { return !m_entries.empty(); }
|
|
|
|
|
|
|
|
/// Creates mapping from name (name must be one of predefined names)
|
|
|
|
static PDFFontCMap createFromName(const QByteArray& name);
|
|
|
|
|
|
|
|
/// Creates mapping from data (data must be a byte array containing the CMap)
|
|
|
|
static PDFFontCMap createFromData(const QByteArray& data);
|
|
|
|
|
|
|
|
/// Serializes the CMap to the byte array
|
|
|
|
QByteArray serialize() const;
|
|
|
|
|
|
|
|
/// Deserializes the CMap from the byte array
|
|
|
|
static PDFFontCMap deserialize(const QByteArray& byteArray);
|
|
|
|
|
|
|
|
/// Converts byte array to array of CIDs
|
|
|
|
std::vector<CID> interpret(const QByteArray& byteArray) const;
|
|
|
|
|
2019-05-03 18:06:00 +02:00
|
|
|
/// Converts CID to QChar, use only on ToUnicode CMaps
|
|
|
|
QChar getToUnicode(CID cid) const;
|
|
|
|
|
2019-04-27 14:14:07 +02:00
|
|
|
private:
|
|
|
|
|
|
|
|
struct Entry
|
|
|
|
{
|
|
|
|
constexpr explicit inline Entry() = default;
|
|
|
|
constexpr explicit inline Entry(unsigned int from, unsigned int to, unsigned int byteCount, CID cid) : from(from), to(to), byteCount(byteCount), cid(cid) { }
|
|
|
|
|
|
|
|
unsigned int from = 0;
|
|
|
|
unsigned int to = 0;
|
|
|
|
unsigned int byteCount = 0;
|
|
|
|
CID cid = 0;
|
|
|
|
|
|
|
|
// Can merge from other CID entry?
|
|
|
|
bool canMerge(const Entry& other) const
|
|
|
|
{
|
|
|
|
const bool sameBytes = byteCount == other.byteCount;
|
|
|
|
const bool compatibleRange = (to + 1) == other.from;
|
|
|
|
const bool compatibleCID = (cid + to + 1) - from == other.cid;
|
|
|
|
return sameBytes && compatibleRange && compatibleCID;
|
|
|
|
}
|
|
|
|
|
|
|
|
inline constexpr Entry merge(const Entry& other) const
|
|
|
|
{
|
|
|
|
return Entry(from, other.to, byteCount, cid);
|
|
|
|
}
|
|
|
|
|
|
|
|
inline constexpr bool operator<(const Entry& other) const
|
|
|
|
{
|
|
|
|
return std::tie(byteCount, from) < std::tie(other.byteCount, other.from);
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
using Entries = std::vector<Entry>;
|
|
|
|
|
|
|
|
explicit PDFFontCMap(Entries&& entries, bool vertical);
|
|
|
|
|
|
|
|
/// Optimizes the entries - merges entries, which can be merged. This function
|
|
|
|
/// requires, that entries are sorted.
|
|
|
|
static Entries optimize(const Entries& entries);
|
|
|
|
|
|
|
|
Entries m_entries;
|
|
|
|
unsigned int m_maxKeyLength = 0;
|
|
|
|
bool m_vertical = false;
|
|
|
|
};
|
|
|
|
|
2020-08-21 16:37:57 +02:00
|
|
|
class PDFType3Font : public PDFFont
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
explicit PDFType3Font(FontDescriptor fontDescriptor,
|
|
|
|
int firstCharacterIndex,
|
|
|
|
int lastCharacterIndex,
|
|
|
|
QMatrix fontMatrix,
|
|
|
|
std::map<int, QByteArray>&& characterContentStreams,
|
|
|
|
std::vector<double>&& widths,
|
|
|
|
const PDFObject& resources,
|
|
|
|
PDFFontCMap toUnicode);
|
|
|
|
|
|
|
|
virtual FontType getFontType() const override;
|
|
|
|
virtual void dumpFontToTreeItem(QTreeWidgetItem*item) const override;
|
2020-10-24 14:39:09 +02:00
|
|
|
virtual const PDFFontCMap* getToUnicode() const override { return &m_toUnicode; }
|
2020-08-21 16:37:57 +02:00
|
|
|
|
|
|
|
/// Returns width of the character. If character doesn't exist, then zero is returned.
|
|
|
|
double getWidth(int characterIndex) const;
|
|
|
|
|
|
|
|
/// Return content stream for the character. If character doesn't exist, then nullptr
|
|
|
|
/// is returned.
|
|
|
|
const QByteArray* getContentStream(int characterIndex) const;
|
|
|
|
|
|
|
|
const QMatrix& getFontMatrix() const { return m_fontMatrix; }
|
|
|
|
const PDFObject& getResources() const { return m_resources; }
|
2020-10-25 13:51:57 +01:00
|
|
|
const std::map<int, QByteArray>& getContentStreams() const { return m_characterContentStreams; }
|
2020-08-21 16:37:57 +02:00
|
|
|
|
|
|
|
/// Returns unicode character for given character index. If unicode mapping is not
|
|
|
|
/// present, empty (null) character is returned.
|
|
|
|
QChar getUnicode(int characterIndex) const { return m_toUnicode.getToUnicode(characterIndex); }
|
|
|
|
|
|
|
|
private:
|
|
|
|
int m_firstCharacterIndex;
|
|
|
|
int m_lastCharacterIndex;
|
|
|
|
QMatrix m_fontMatrix;
|
|
|
|
std::map<int, QByteArray> m_characterContentStreams;
|
|
|
|
std::vector<double> m_widths;
|
|
|
|
PDFObject m_resources;
|
|
|
|
PDFFontCMap m_toUnicode;
|
|
|
|
};
|
|
|
|
|
2019-04-27 14:14:07 +02:00
|
|
|
/// Composite font (CID-keyed font)
|
|
|
|
class PDFType0Font : public PDFFont
|
|
|
|
{
|
|
|
|
public:
|
2019-05-03 18:06:00 +02:00
|
|
|
explicit inline PDFType0Font(FontDescriptor fontDescriptor, PDFFontCMap cmap, PDFFontCMap toUnicode, PDFCIDtoGIDMapper mapper, PDFReal defaultAdvance, std::unordered_map<CID, PDFReal> advances) :
|
2019-04-27 14:14:07 +02:00
|
|
|
PDFFont(qMove(fontDescriptor)),
|
|
|
|
m_cmap(qMove(cmap)),
|
2019-05-03 18:06:00 +02:00
|
|
|
m_toUnicode(qMove(toUnicode)),
|
2019-04-30 18:38:27 +02:00
|
|
|
m_mapper(qMove(mapper)),
|
|
|
|
m_defaultAdvance(defaultAdvance),
|
|
|
|
m_advances(qMove(advances))
|
2019-04-27 14:14:07 +02:00
|
|
|
{
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
virtual ~PDFType0Font() = default;
|
|
|
|
|
|
|
|
virtual FontType getFontType() const override { return FontType::Type0; }
|
2020-10-24 14:39:09 +02:00
|
|
|
virtual const PDFFontCMap* getToUnicode() const override { return &m_toUnicode; }
|
2019-04-27 14:14:07 +02:00
|
|
|
|
|
|
|
const PDFFontCMap* getCMap() const { return &m_cmap; }
|
|
|
|
const PDFCIDtoGIDMapper* getCIDtoGIDMapper() const { return &m_mapper; }
|
|
|
|
|
2019-04-30 18:38:27 +02:00
|
|
|
/// Returns the glyph advance, if it can be obtained, or zero, if it cannot
|
|
|
|
/// be obtained or error occurs.
|
|
|
|
/// \param cid CID of the glyph
|
|
|
|
PDFReal getGlyphAdvance(CID cid) const;
|
|
|
|
|
2019-04-27 14:14:07 +02:00
|
|
|
private:
|
|
|
|
PDFFontCMap m_cmap;
|
2019-05-03 18:06:00 +02:00
|
|
|
PDFFontCMap m_toUnicode;
|
2019-04-27 14:14:07 +02:00
|
|
|
PDFCIDtoGIDMapper m_mapper;
|
2019-04-30 18:38:27 +02:00
|
|
|
PDFReal m_defaultAdvance;
|
|
|
|
std::unordered_map<CID, PDFReal> m_advances;
|
2019-04-27 14:14:07 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
/// Repository with predefined CMaps
|
2020-12-20 19:03:58 +01:00
|
|
|
class Pdf4QtLIBSHARED_EXPORT PDFFontCMapRepository
|
2019-04-27 14:14:07 +02:00
|
|
|
{
|
|
|
|
public:
|
|
|
|
/// Returns instance of CMAP repository
|
|
|
|
static PDFFontCMapRepository* getInstance();
|
|
|
|
|
|
|
|
/// Adds CMAP to the repository
|
|
|
|
void add(const QByteArray& key, QByteArray value) { m_cmaps[key] = qMove(value); }
|
|
|
|
|
|
|
|
/// Clears the repository
|
|
|
|
void clear() { m_cmaps.clear(); }
|
|
|
|
|
|
|
|
/// Saves the repository content to the file
|
|
|
|
void saveToFile(const QString& fileName) const;
|
|
|
|
|
|
|
|
/// Loads the repository content from the file
|
|
|
|
bool loadFromFile(const QString& fileName);
|
|
|
|
|
|
|
|
private:
|
|
|
|
explicit PDFFontCMapRepository();
|
|
|
|
|
|
|
|
/// Storage for predefined cmaps
|
|
|
|
std::map<QByteArray, QByteArray> m_cmaps;
|
|
|
|
};
|
|
|
|
|
2019-03-25 18:44:45 +01:00
|
|
|
} // namespace pdf
|
|
|
|
|
|
|
|
#endif // PDFFONT_H
|