2021-04-30 20:12:10 +02:00
// Copyright (C) 2019-2021 Jakub Melka
2019-05-07 18:21:22 +02:00
//
2020-12-20 19:03:58 +01:00
// This file is part of Pdf4Qt.
2019-05-07 18:21:22 +02:00
//
2020-12-20 19:03:58 +01:00
// Pdf4Qt is free software: you can redistribute it and/or modify
2019-05-07 18:21:22 +02:00
// it under the terms of the GNU Lesser General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
2021-04-30 20:12:10 +02:00
// with the written consent of the copyright owner, any later version.
2019-05-07 18:21:22 +02:00
//
2020-12-20 19:03:58 +01:00
// Pdf4Qt is distributed in the hope that it will be useful,
2019-05-07 18:21:22 +02:00
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public License
2020-12-20 19:03:58 +01:00
// along with Pdf4Qt. If not, see <https://www.gnu.org/licenses/>.
2019-05-07 18:21:22 +02:00
# include "pdfimage.h"
# include "pdfdocument.h"
# include "pdfconstants.h"
# include "pdfexception.h"
2019-06-15 17:40:22 +02:00
# include "pdfutils.h"
2019-10-26 18:02:37 +02:00
# include "pdfjbig2decoder.h"
2019-10-13 19:02:38 +02:00
# include "pdfccittfaxdecoder.h"
2019-05-07 18:21:22 +02:00
# include <openjpeg.h>
# include <jpeglib.h>
namespace pdf
{
struct PDFJPEG2000ImageData
{
const QByteArray * byteArray = nullptr ;
OPJ_SIZE_T position = 0 ;
2019-05-10 19:48:52 +02:00
std : : vector < PDFRenderError > errors ;
2019-05-07 18:21:22 +02:00
static OPJ_SIZE_T read ( void * p_buffer , OPJ_SIZE_T p_nb_bytes , void * p_user_data ) ;
static OPJ_BOOL seek ( OPJ_OFF_T p_nb_bytes , void * p_user_data ) ;
static OPJ_OFF_T skip ( OPJ_OFF_T p_nb_bytes , void * p_user_data ) ;
} ;
struct PDFJPEGDCTSource
{
jpeg_source_mgr sourceManager ;
const QByteArray * buffer = nullptr ;
2019-09-14 19:14:01 +02:00
int startByte = 0 ;
2019-05-07 18:21:22 +02:00
} ;
2019-10-18 17:28:45 +02:00
PDFImage PDFImage : : createImage ( const PDFDocument * document ,
const PDFStream * stream ,
PDFColorSpacePointer colorSpace ,
bool isSoftMask ,
RenderingIntent renderingIntent ,
PDFRenderErrorReporter * errorReporter )
2019-05-07 18:21:22 +02:00
{
PDFImage image ;
image . m_colorSpace = colorSpace ;
2019-10-18 17:28:45 +02:00
image . m_renderingIntent = renderingIntent ;
2019-05-07 18:21:22 +02:00
const PDFDictionary * dictionary = stream - > getDictionary ( ) ;
QByteArray content = document - > getDecodedStream ( stream ) ;
PDFDocumentDataLoaderDecorator loader ( document ) ;
if ( content . isEmpty ( ) )
{
2019-09-27 18:41:56 +02:00
throw PDFException ( PDFTranslationContext : : tr ( " Image has not data. " ) ) ;
2019-05-07 18:21:22 +02:00
}
2019-06-15 14:29:49 +02:00
PDFImageData : : MaskingType maskingType = PDFImageData : : MaskingType : : None ;
std : : vector < PDFInteger > mask ;
2019-06-15 17:40:22 +02:00
std : : vector < PDFReal > decode = loader . readNumberArrayFromDictionary ( dictionary , " Decode " ) ;
bool imageMask = loader . readBooleanFromDictionary ( dictionary , " ImageMask " , false ) ;
2019-10-05 15:11:53 +02:00
std : : vector < PDFReal > matte = loader . readNumberArrayFromDictionary ( dictionary , " Matte " ) ;
2019-10-19 14:17:50 +02:00
PDFInteger sMaskInData = loader . readIntegerFromDictionary ( dictionary , " SMaskInData " , 0 ) ;
2020-08-15 15:57:55 +02:00
image . m_interpolate = loader . readBooleanFromDictionary ( dictionary , " Interpolate " , false ) ;
image . m_alternates = loader . readObjectList < PDFAlternateImage > ( dictionary - > get ( " Alternates " ) ) ;
image . m_name = loader . readNameFromDictionary ( dictionary , " Name " ) ;
image . m_structuralParent = loader . readIntegerFromDictionary ( dictionary , " StructParent " , 0 ) ;
image . m_webCaptureContentSetId = loader . readStringFromDictionary ( dictionary , " ID " ) ;
image . m_OPI = dictionary - > get ( " OPI " ) ;
image . m_OC = dictionary - > get ( " OC " ) ;
image . m_metadata = dictionary - > get ( " Metadata " ) ;
image . m_associatedFiles = dictionary - > get ( " AF " ) ;
image . m_measure = dictionary - > get ( " Measure " ) ;
image . m_pointData = dictionary - > get ( " PtData " ) ;
2019-10-05 15:11:53 +02:00
if ( isSoftMask & & ( imageMask | | dictionary - > hasKey ( " Mask " ) | | dictionary - > hasKey ( " SMask " ) ) )
{
2019-10-05 17:38:15 +02:00
throw PDFRendererException ( RenderErrorType : : Error , PDFTranslationContext : : tr ( " Soft mask image can't have mask / soft mask itself. " ) ) ;
2019-10-05 15:11:53 +02:00
}
if ( ! isSoftMask & & ! matte . empty ( ) )
{
2019-10-05 17:38:15 +02:00
throw PDFRendererException ( RenderErrorType : : Error , PDFTranslationContext : : tr ( " Regular image can't have Matte entry (used for soft masks) . " )) ;
2019-10-05 15:11:53 +02:00
}
2019-06-15 14:29:49 +02:00
2019-10-18 17:28:45 +02:00
// Set rendering intent
if ( dictionary - > hasKey ( " Intent " ) )
{
QByteArray renderingIntentName = loader . readNameFromDictionary ( dictionary , " Intent " ) ;
if ( renderingIntentName = = " Perceptual " )
{
image . m_renderingIntent = RenderingIntent : : Perceptual ;
}
else if ( renderingIntentName = = " AbsoluteColorimetric " )
{
image . m_renderingIntent = RenderingIntent : : AbsoluteColorimetric ;
}
else if ( renderingIntentName = = " RelativeColorimetric " )
{
image . m_renderingIntent = RenderingIntent : : RelativeColorimetric ;
}
else if ( renderingIntentName = = " Saturation " )
{
image . m_renderingIntent = RenderingIntent : : Saturation ;
}
}
2019-06-15 14:29:49 +02:00
// Fill Mask
if ( dictionary - > hasKey ( " Mask " ) )
{
const PDFObject & object = document - > getObject ( dictionary - > get ( " Mask " ) ) ;
if ( object . isArray ( ) )
{
maskingType = PDFImageData : : MaskingType : : ColorKeyMasking ;
mask = loader . readIntegerArray ( object ) ;
}
else if ( object . isStream ( ) )
{
2019-10-19 11:08:37 +02:00
PDFImage softMaskImage = createImage ( document , object . getStream ( ) , colorSpace , false , renderingIntent , errorReporter ) ;
if ( softMaskImage . m_imageData . getMaskingType ( ) ! = PDFImageData : : MaskingType : : ImageMask | |
softMaskImage . m_imageData . getColorChannels ( ) ! = 1 | |
softMaskImage . m_imageData . getBitsPerComponent ( ) ! = 1 )
{
throw PDFRendererException ( RenderErrorType : : NotImplemented , PDFTranslationContext : : tr ( " Invalid mask image. " ) ) ;
}
// We must alter decode, because it has opposite meaning (it is transparency)
std : : vector < PDFReal > decode = softMaskImage . m_imageData . getDecode ( ) ;
if ( decode . size ( ) < 2 )
{
decode = { 0.0 , 1.0 } ;
}
std : : swap ( decode [ 0 ] , decode [ 1 ] ) ;
// Create soft mask from image
maskingType = PDFImageData : : MaskingType : : SoftMask ;
image . m_softMask = qMove ( softMaskImage . m_imageData ) ;
image . m_softMask . setMaskingType ( PDFImageData : : MaskingType : : None ) ;
image . m_softMask . setDecode ( qMove ( decode ) ) ;
2019-06-15 14:29:49 +02:00
}
}
2019-10-05 15:11:53 +02:00
else if ( dictionary - > hasKey ( " SMask " ) )
{
// Parse soft mask image
const PDFObject & softMaskObject = document - > getObject ( dictionary - > get ( " SMask " ) ) ;
if ( softMaskObject . isStream ( ) )
{
2019-10-18 17:28:45 +02:00
PDFImage softMaskImage = createImage ( document , softMaskObject . getStream ( ) , PDFColorSpacePointer ( new PDFDeviceGrayColorSpace ( ) ) , true , renderingIntent , errorReporter ) ;
2019-10-05 15:11:53 +02:00
maskingType = PDFImageData : : MaskingType : : SoftMask ;
image . m_softMask = qMove ( softMaskImage . m_imageData ) ;
}
else if ( ! softMaskObject . isNull ( ) )
{
throw PDFRendererException ( RenderErrorType : : NotImplemented , PDFTranslationContext : : tr ( " Invalid soft mask object. " ) ) ;
}
}
2019-06-15 14:29:49 +02:00
2019-06-15 17:40:22 +02:00
if ( imageMask )
{
maskingType = PDFImageData : : MaskingType : : ImageMask ;
}
2019-05-07 18:21:22 +02:00
// Retrieve filters
PDFObject filters ;
if ( dictionary - > hasKey ( PDF_STREAM_DICT_FILTER ) )
{
filters = document - > getObject ( dictionary - > get ( PDF_STREAM_DICT_FILTER ) ) ;
}
else if ( dictionary - > hasKey ( PDF_STREAM_DICT_FILE_FILTER ) )
{
filters = document - > getObject ( dictionary - > get ( PDF_STREAM_DICT_FILE_FILTER ) ) ;
}
// Retrieve filter parameters
PDFObject filterParameters ;
if ( dictionary - > hasKey ( PDF_STREAM_DICT_DECODE_PARMS ) )
{
filterParameters = document - > getObject ( dictionary - > get ( PDF_STREAM_DICT_DECODE_PARMS ) ) ;
}
else if ( dictionary - > hasKey ( PDF_STREAM_DICT_FDECODE_PARMS ) )
{
filterParameters = document - > getObject ( dictionary - > get ( PDF_STREAM_DICT_FDECODE_PARMS ) ) ;
}
QByteArray imageFilterName ;
if ( filters . isName ( ) )
{
imageFilterName = filters . getString ( ) ;
}
else if ( filters . isArray ( ) )
{
const PDFArray * filterArray = filters . getArray ( ) ;
const size_t filterCount = filterArray - > getCount ( ) ;
if ( filterCount )
{
const PDFObject & object = document - > getObject ( filterArray - > getItem ( filterCount - 1 ) ) ;
if ( object . isName ( ) )
{
imageFilterName = object . getString ( ) ;
}
}
}
2019-10-13 19:02:38 +02:00
const PDFDictionary * filterParamsDictionary = nullptr ;
if ( filterParameters . isDictionary ( ) )
{
filterParamsDictionary = filterParameters . getDictionary ( ) ;
}
else if ( filterParameters . isArray ( ) )
{
const PDFArray * filterParametersArray = filterParameters . getArray ( ) ;
const size_t filterParamsCount = filterParametersArray - > getCount ( ) ;
if ( filterParamsCount )
{
const PDFObject & object = document - > getObject ( filterParametersArray - > getItem ( filterParamsCount - 1 ) ) ;
if ( object . isDictionary ( ) )
{
filterParamsDictionary = object . getDictionary ( ) ;
}
}
}
2019-05-07 18:21:22 +02:00
if ( imageFilterName = = " DCTDecode " | | imageFilterName = = " DCT " )
{
int colorTransform = loader . readIntegerFromDictionary ( dictionary , " ColorTransform " , - 1 ) ;
jpeg_decompress_struct codec ;
jpeg_error_mgr errorManager ;
std : : memset ( & codec , 0 , sizeof ( jpeg_decompress_struct ) ) ;
std : : memset ( & errorManager , 0 , sizeof ( errorManager ) ) ;
PDFJPEGDCTSource source ;
source . buffer = & content ;
std : : memset ( & source . sourceManager , 0 , sizeof ( jpeg_source_mgr ) ) ;
2019-09-14 19:14:01 +02:00
// Fix issue, that image doesn't start with FFD8 (start of image marker). If this
// occurs, try to find sequence FFD8, and if we can find it, then advance the buffer.
source . startByte = qMax ( content . indexOf ( " \xFF \xD8 " ) , 0 ) ;
if ( source . startByte > 0 )
{
errorReporter - > reportRenderError ( RenderErrorType : : Warning , PDFTranslationContext : : tr ( " Malformed data while reading JPEG stream. %1 bytes skipped. " ) . arg ( source . startByte ) ) ;
}
2019-05-07 18:21:22 +02:00
auto errorMethod = [ ] ( j_common_ptr ptr )
{
char buffer [ JMSG_LENGTH_MAX ] = { } ;
( ptr - > err - > format_message ) ( ptr , buffer ) ;
jpeg_destroy ( ptr ) ;
2019-09-27 18:41:56 +02:00
throw PDFException ( PDFTranslationContext : : tr ( " Error reading JPEG (DCT) image : % 1. " ).arg(QString::fromLatin1(buffer))) ;
2019-05-07 18:21:22 +02:00
} ;
auto fillInputBufferMethod = [ ] ( j_decompress_ptr decompress ) - > boolean
{
PDFJPEGDCTSource * source = reinterpret_cast < PDFJPEGDCTSource * > ( decompress - > src ) ;
if ( ! source - > sourceManager . next_input_byte )
{
const QByteArray * buffer = source - > buffer ;
source - > sourceManager . next_input_byte = reinterpret_cast < const JOCTET * > ( buffer - > constData ( ) ) ;
source - > sourceManager . bytes_in_buffer = buffer - > size ( ) ;
2019-09-14 19:14:01 +02:00
source - > sourceManager . next_input_byte + = source - > startByte ;
source - > sourceManager . bytes_in_buffer - = source - > startByte ;
2019-05-07 18:21:22 +02:00
return TRUE ;
}
return FALSE ;
} ;
auto skipInputDataMethod = [ ] ( j_decompress_ptr decompress , long num_bytes )
{
PDFJPEGDCTSource * source = reinterpret_cast < PDFJPEGDCTSource * > ( decompress - > src ) ;
const size_t skippedBytes = qMin ( source - > sourceManager . bytes_in_buffer , static_cast < size_t > ( num_bytes ) ) ;
source - > sourceManager . next_input_byte + = skippedBytes ;
source - > sourceManager . bytes_in_buffer - = skippedBytes ;
} ;
source . sourceManager . bytes_in_buffer = 0 ;
source . sourceManager . next_input_byte = nullptr ;
source . sourceManager . init_source = [ ] ( j_decompress_ptr ) { } ;
source . sourceManager . fill_input_buffer = fillInputBufferMethod ;
source . sourceManager . skip_input_data = skipInputDataMethod ;
source . sourceManager . resync_to_restart = jpeg_resync_to_restart ;
source . sourceManager . term_source = [ ] ( j_decompress_ptr ) { } ;
jpeg_std_error ( & errorManager ) ;
errorManager . error_exit = errorMethod ;
codec . err = & errorManager ;
jpeg_create_decompress ( & codec ) ;
codec . src = reinterpret_cast < jpeg_source_mgr * > ( & source ) ;
if ( jpeg_read_header ( & codec , TRUE ) = = JPEG_HEADER_OK )
{
// Determine color transform
if ( colorTransform = = - 1 & & codec . saw_Adobe_marker )
{
colorTransform = codec . Adobe_transform ;
}
// Set the input transform
if ( colorTransform > - 1 )
{
switch ( codec . num_components )
{
case 3 :
{
codec . jpeg_color_space = colorTransform ? JCS_YCbCr : JCS_RGB ;
break ;
}
case 4 :
{
codec . jpeg_color_space = colorTransform ? JCS_YCCK : JCS_CMYK ;
break ;
}
default :
break ;
}
}
jpeg_start_decompress ( & codec ) ;
const JDIMENSION rowStride = codec . output_width * codec . output_components ;
JSAMPARRAY samples = codec . mem - > alloc_sarray ( reinterpret_cast < j_common_ptr > ( & codec ) , JPOOL_IMAGE , rowStride , 1 ) ;
JDIMENSION scanLineCount = codec . output_height ;
const unsigned int width = codec . output_width ;
const unsigned int height = codec . output_height ;
const unsigned int components = codec . output_components ;
const unsigned int bitsPerComponent = 8 ;
QByteArray buffer ( rowStride * height , 0 ) ;
JSAMPROW rowData = reinterpret_cast < JSAMPROW > ( buffer . data ( ) ) ;
while ( scanLineCount )
{
JDIMENSION readCount = jpeg_read_scanlines ( & codec , samples , 1 ) ;
std : : memcpy ( rowData , samples [ 0 ] , rowStride ) ;
scanLineCount - = readCount ;
rowData + = rowStride ;
}
jpeg_finish_decompress ( & codec ) ;
2019-10-05 15:11:53 +02:00
image . m_imageData = PDFImageData ( components , bitsPerComponent , width , height , rowStride , maskingType , qMove ( buffer ) , qMove ( mask ) , qMove ( decode ) , qMove ( matte ) ) ;
2019-05-07 18:21:22 +02:00
}
jpeg_destroy_decompress ( & codec ) ;
}
else if ( imageFilterName = = " JPXDecode " )
{
PDFJPEG2000ImageData imageData ;
imageData . byteArray = & content ;
imageData . position = 0 ;
2019-05-10 19:48:52 +02:00
auto warningCallback = [ ] ( const char * message , void * userData )
{
PDFJPEG2000ImageData * data = reinterpret_cast < PDFJPEG2000ImageData * > ( userData ) ;
data - > errors . push_back ( PDFRenderError ( RenderErrorType : : Warning , PDFTranslationContext : : tr ( " JPEG 2000 Warning: %1 " ) . arg ( QString : : fromLatin1 ( message ) ) ) ) ;
} ;
auto errorCallback = [ ] ( const char * message , void * userData )
{
PDFJPEG2000ImageData * data = reinterpret_cast < PDFJPEG2000ImageData * > ( userData ) ;
data - > errors . push_back ( PDFRenderError ( RenderErrorType : : Error , PDFTranslationContext : : tr ( " JPEG 2000 Error: %1 " ) . arg ( QString : : fromLatin1 ( message ) ) ) ) ;
} ;
2019-05-07 18:21:22 +02:00
opj_dparameters_t decompressParameters ;
opj_set_default_decoder_parameters ( & decompressParameters ) ;
2019-05-12 14:59:08 +02:00
const bool isIndexed = dynamic_cast < const PDFIndexedColorSpace * > ( image . m_colorSpace . data ( ) ) ;
if ( isIndexed )
{
// What is this flag for? When we have indexed color space, we do not want to resolve index to color
// using the color map in the image. Instead of that, we just get indices and resolve them using
// our color space.
decompressParameters . flags | = OPJ_DPARAMETERS_IGNORE_PCLR_CMAP_CDEF_FLAG ;
}
2019-05-10 19:48:52 +02:00
constexpr CODEC_FORMAT formats [ ] = { OPJ_CODEC_J2K , OPJ_CODEC_JP2 , OPJ_CODEC_JPT , OPJ_CODEC_JPP , OPJ_CODEC_JPX } ;
2019-05-07 18:21:22 +02:00
for ( CODEC_FORMAT format : formats )
{
opj_codec_t * codec = opj_create_decompress ( format ) ;
if ( ! codec )
{
// Codec is not present
continue ;
}
2019-05-10 19:48:52 +02:00
opj_set_warning_handler ( codec , warningCallback , & imageData ) ;
opj_set_error_handler ( codec , errorCallback , & imageData ) ;
opj_stream_t * stream = opj_stream_create ( content . size ( ) , OPJ_TRUE ) ;
opj_stream_set_user_data ( stream , & imageData , nullptr ) ;
opj_stream_set_user_data_length ( stream , content . size ( ) ) ;
opj_stream_set_read_function ( stream , & PDFJPEG2000ImageData : : read ) ;
opj_stream_set_seek_function ( stream , & PDFJPEG2000ImageData : : seek ) ;
opj_stream_set_skip_function ( stream , & PDFJPEG2000ImageData : : skip ) ;
2019-05-07 18:21:22 +02:00
2019-05-10 19:48:52 +02:00
// Reset the stream position, clear the data
imageData . position = 0 ;
imageData . errors . clear ( ) ;
opj_image_t * jpegImage = nullptr ;
// Setup the decoder
if ( opj_setup_decoder ( codec , & decompressParameters ) )
2019-05-07 18:21:22 +02:00
{
2019-05-10 19:48:52 +02:00
// Try to read the header
if ( opj_read_header ( stream , codec , & jpegImage ) )
2019-05-07 18:21:22 +02:00
{
2019-05-10 19:48:52 +02:00
if ( opj_set_decode_area ( codec , jpegImage , decompressParameters . DA_x0 , decompressParameters . DA_y0 , decompressParameters . DA_x1 , decompressParameters . DA_y1 ) )
2019-05-07 18:21:22 +02:00
{
2019-05-10 19:48:52 +02:00
if ( opj_decode ( codec , stream , jpegImage ) )
2019-05-07 18:21:22 +02:00
{
2019-05-10 19:48:52 +02:00
if ( opj_end_decompress ( codec , stream ) )
{
2019-05-07 18:21:22 +02:00
2019-05-10 19:48:52 +02:00
}
2019-05-07 18:21:22 +02:00
}
}
}
}
2019-05-10 19:48:52 +02:00
opj_stream_destroy ( stream ) ;
2019-05-07 18:21:22 +02:00
opj_destroy_codec ( codec ) ;
2019-05-10 19:48:52 +02:00
stream = nullptr ;
codec = nullptr ;
// If we have a valid image, then adjust it
if ( jpegImage )
{
2019-10-19 14:17:50 +02:00
// This image type can have color space defined in the data (definition of color space in PDF
// is only optional). So, if we doesn't have a color space, then we must determine it from the data.
if ( ! image . m_colorSpace )
{
switch ( jpegImage - > color_space )
{
case OPJ_CLRSPC_SRGB :
image . m_colorSpace . reset ( new PDFDeviceRGBColorSpace ( ) ) ;
break ;
case OPJ_CLRSPC_GRAY :
image . m_colorSpace . reset ( new PDFDeviceGrayColorSpace ( ) ) ;
break ;
case OPJ_CLRSPC_CMYK :
image . m_colorSpace . reset ( new PDFDeviceCMYKColorSpace ( ) ) ;
break ;
default :
imageData . errors . push_back ( PDFRenderError ( RenderErrorType : : Error , PDFTranslationContext : : tr ( " Unknown color space for JPEG 2000 image. " ) ) ) ;
break ;
}
2020-07-10 17:08:22 +02:00
// Jakub Melka: Try to use ICC profile, if image has it
if ( jpegImage - > icc_profile_buf & & jpegImage - > icc_profile_len > 0 & & image . m_colorSpace )
{
QByteArray iccProfileData ( reinterpret_cast < const char * > ( jpegImage - > icc_profile_buf ) , jpegImage - > icc_profile_len ) ;
PDFICCBasedColorSpace : : Ranges ranges = { 0.0 , 1.0 , 0.0 , 1.0 , 0.0 , 1.0 , 0.0 , 1.0 } ;
2020-08-11 17:46:03 +02:00
image . m_colorSpace . reset ( new PDFICCBasedColorSpace ( image . m_colorSpace , ranges , qMove ( iccProfileData ) , PDFObjectReference ( ) ) ) ;
2020-07-10 17:08:22 +02:00
}
2019-10-19 14:17:50 +02:00
}
2019-05-10 19:48:52 +02:00
// First we must check, if all components are valid (i.e has same width/height/precision)
2019-10-19 14:17:50 +02:00
std : : vector < OPJ_UINT32 > ordinaryComponents ;
std : : vector < OPJ_UINT32 > alphaComponents ;
2019-05-10 19:48:52 +02:00
bool valid = true ;
const OPJ_UINT32 componentCount = jpegImage - > numcomps ;
2019-10-19 14:17:50 +02:00
ordinaryComponents . reserve ( componentCount ) ;
for ( OPJ_UINT32 i = 0 ; i < componentCount ; + + i )
2019-05-10 19:48:52 +02:00
{
if ( jpegImage - > comps [ 0 ] . w ! = jpegImage - > comps [ i ] . w | |
jpegImage - > comps [ 0 ] . h ! = jpegImage - > comps [ i ] . h | |
jpegImage - > comps [ 0 ] . prec ! = jpegImage - > comps [ i ] . prec | |
jpegImage - > comps [ 0 ] . sgnd ! = jpegImage - > comps [ i ] . sgnd )
{
valid = false ;
break ;
}
2019-10-19 14:17:50 +02:00
else
{
// Fill in ordinary component, or alpha component
if ( ! jpegImage - > comps [ i ] . alpha )
{
ordinaryComponents . push_back ( i ) ;
}
else
{
alphaComponents . push_back ( i ) ;
}
}
2019-05-10 19:48:52 +02:00
}
if ( valid )
{
2019-10-19 14:17:50 +02:00
const size_t colorSpaceComponentCount = image . m_colorSpace - > getColorComponentCount ( ) ;
const bool hasAlphaChannel = ! alphaComponents . empty ( ) ;
if ( colorSpaceComponentCount < ordinaryComponents . size ( ) )
{
// We have too much ordinary components
imageData . errors . push_back ( PDFRenderError ( RenderErrorType : : Warning , PDFTranslationContext : : tr ( " JPEG 2000 image has too much non-alpha channels. Ignoring %1 channels. " ) . arg ( ordinaryComponents . size ( ) - colorSpaceComponentCount ) ) ) ;
}
if ( alphaComponents . size ( ) > 1 )
{
// We support only one alpha channel component
imageData . errors . push_back ( PDFRenderError ( RenderErrorType : : Warning , PDFTranslationContext : : tr ( " JPEG 2000 image has too much alpha channels. Ignoring %1 alpha channels. " ) . arg ( alphaComponents . size ( ) - 1 ) ) ) ;
}
2019-05-10 19:48:52 +02:00
const OPJ_UINT32 w = jpegImage - > comps [ 0 ] . w ;
const OPJ_UINT32 h = jpegImage - > comps [ 0 ] . h ;
const OPJ_UINT32 prec = jpegImage - > comps [ 0 ] . prec ;
const OPJ_UINT32 sgnd = jpegImage - > comps [ 0 ] . sgnd ;
int signumCorrection = ( sgnd ) ? ( 1 < < ( prec - 1 ) ) : 0 ;
int shiftLeft = ( jpegImage - > comps [ 0 ] . prec < 8 ) ? 8 - jpegImage - > comps [ 0 ] . prec : 0 ;
int shiftRight = ( jpegImage - > comps [ 0 ] . prec > 8 ) ? jpegImage - > comps [ 0 ] . prec - 8 : 0 ;
auto transformValue = [ signumCorrection , isIndexed , shiftLeft , shiftRight ] ( int value ) - > unsigned char
{
value + = signumCorrection ;
if ( ! isIndexed )
{
// Indexed color space should have at most 255 indices, do not modify indices in this case
if ( shiftLeft > 0 )
{
value = value < < shiftLeft ;
}
else if ( shiftRight > 0 )
{
// We clamp value to the lower part (so, we use similar algorithm as in 'floor' function).
//
value = value > > shiftRight ;
}
}
value = qBound ( 0 , value , 255 ) ;
return static_cast < unsigned char > ( value ) ;
} ;
// Variables for image data. We convert all components to the 8-bit format
2019-10-19 14:17:50 +02:00
const size_t ordinaryComponentCount = ordinaryComponents . size ( ) ;
unsigned int components = static_cast < unsigned int > ( qMin ( ordinaryComponentCount , colorSpaceComponentCount ) ) ;
2019-05-10 19:48:52 +02:00
unsigned int bitsPerComponent = 8 ;
unsigned int width = w ;
unsigned int height = h ;
unsigned int stride = w * components ;
QByteArray imageDataBuffer ( components * width * height , 0 ) ;
for ( unsigned int row = 0 ; row < h ; + + row )
{
for ( unsigned int col = 0 ; col < w ; + + col )
{
for ( unsigned int componentIndex = 0 ; componentIndex < components ; + + componentIndex )
{
int index = stride * row + col * components + componentIndex ;
Q_ASSERT ( index < imageDataBuffer . size ( ) ) ;
2019-10-19 14:17:50 +02:00
imageDataBuffer [ index ] = transformValue ( jpegImage - > comps [ ordinaryComponents [ componentIndex ] ] . data [ w * row + col ] ) ;
2019-05-10 19:48:52 +02:00
}
}
}
2019-10-05 15:11:53 +02:00
image . m_imageData = PDFImageData ( components , bitsPerComponent , width , height , stride , maskingType , qMove ( imageDataBuffer ) , qMove ( mask ) , qMove ( decode ) , qMove ( matte ) ) ;
2019-06-15 14:29:49 +02:00
valid = image . m_imageData . isValid ( ) ;
2019-10-19 14:17:50 +02:00
// Handle the alpha channel buffer - create soft mask. If SMaskInData equals to 1, then alpha channel is used.
// If SMaskInData equals to 2, then premultiplied alpha channel is used.
if ( hasAlphaChannel & & ( sMaskInData = = 1 | | sMaskInData = = 2 ) )
{
const int alphaStride = w ;
QByteArray alphaDataBuffer ( width * height , 0 ) ;
const OPJ_UINT32 alphaComponentIndex = alphaComponents . front ( ) ;
for ( unsigned int row = 0 ; row < h ; + + row )
{
for ( unsigned int col = 0 ; col < w ; + + col )
{
int index = alphaStride * row + col ;
Q_ASSERT ( index < alphaDataBuffer . size ( ) ) ;
alphaDataBuffer [ index ] = transformValue ( jpegImage - > comps [ alphaComponentIndex ] . data [ w * row + col ] ) ;
}
}
if ( sMaskInData = = 2 )
{
matte . resize ( ordinaryComponentCount , 0.0 ) ;
}
image . m_softMask = PDFImageData ( 1 , bitsPerComponent , width , height , alphaStride , PDFImageData : : MaskingType : : None , qMove ( alphaDataBuffer ) , { } , { } , qMove ( matte ) ) ;
image . m_imageData . setMaskingType ( PDFImageData : : MaskingType : : SoftMask ) ;
}
2019-05-10 19:48:52 +02:00
}
else
{
2019-06-15 14:29:49 +02:00
// Easiest way is to just add errors to the error list
2019-05-10 19:48:52 +02:00
imageData . errors . push_back ( PDFRenderError ( RenderErrorType : : Error , PDFTranslationContext : : tr ( " Incompatible color components for JPEG 2000 image. " ) ) ) ;
}
opj_image_destroy ( jpegImage ) ;
2019-06-15 14:29:49 +02:00
if ( valid )
{
// Image was successfully decoded
break ;
}
2019-05-10 19:48:52 +02:00
}
2019-05-07 18:21:22 +02:00
}
2019-05-10 19:48:52 +02:00
// Report errors, if we have any
if ( ! imageData . errors . empty ( ) )
{
for ( const PDFRenderError & error : imageData . errors )
{
QString message = error . message . simplified ( ) . trimmed ( ) ;
if ( error . type = = RenderErrorType : : Error )
{
throw PDFRendererException ( error . type , message ) ;
}
else
{
errorReporter - > reportRenderError ( error . type , message ) ;
}
}
}
2019-05-07 18:21:22 +02:00
}
2019-10-05 13:08:32 +02:00
else if ( imageFilterName = = " CCITTFaxDecode " | | imageFilterName = = " CCF " )
2019-06-15 14:29:49 +02:00
{
2019-10-13 19:02:38 +02:00
if ( ! filterParamsDictionary )
{
throw PDFRendererException ( RenderErrorType : : Error , PDFTranslationContext : : tr ( " Invalid parameters for filter CCITT fax decode. " ) ) ;
}
PDFCCITTFaxDecoderParameters parameters ;
parameters . maskingType = maskingType ;
parameters . K = loader . readIntegerFromDictionary ( filterParamsDictionary , " K " , 0 ) ;
parameters . hasEndOfLine = loader . readBooleanFromDictionary ( filterParamsDictionary , " EndOfLine " , false ) ;
parameters . hasEncodedByteAlign = loader . readBooleanFromDictionary ( filterParamsDictionary , " EncodedByteAlign " , false ) ;
parameters . columns = loader . readIntegerFromDictionary ( filterParamsDictionary , " Columns " , 1728 ) ;
parameters . rows = loader . readIntegerFromDictionary ( filterParamsDictionary , " Rows " , 0 ) ;
parameters . hasEndOfBlock = loader . readBooleanFromDictionary ( filterParamsDictionary , " EndOfBlock " , true ) ;
parameters . hasBlackIsOne = loader . readBooleanFromDictionary ( filterParamsDictionary , " BlackIs1 " , false ) ;
parameters . damagedRowsBeforeError = loader . readIntegerFromDictionary ( filterParamsDictionary , " DamagedRowsBeforeError " , 0 ) ;
2019-10-18 17:28:45 +02:00
parameters . decode = ! decode . empty ( ) ? qMove ( decode ) : std : : vector < PDFReal > ( { 0.0 , 1.0 } ) ;
2019-10-13 19:02:38 +02:00
QByteArray imageDataBuffer = document - > getDecodedStream ( stream ) ;
PDFCCITTFaxDecoder decoder ( & imageDataBuffer , parameters ) ;
image . m_imageData = decoder . decode ( ) ;
2019-06-15 14:29:49 +02:00
}
else if ( imageFilterName = = " JBIG2Decode " )
{
2019-10-26 18:02:37 +02:00
QByteArray data = document - > getDecodedStream ( stream ) ;
QByteArray globalData ;
if ( filterParamsDictionary )
{
const PDFObject & globalDataObject = document - > getObject ( filterParamsDictionary - > get ( " JBIG2Globals " ) ) ;
if ( globalDataObject . isStream ( ) )
{
globalData = document - > getDecodedStream ( globalDataObject . getStream ( ) ) ;
}
}
PDFJBIG2Decoder decoder ( qMove ( data ) , qMove ( globalData ) , errorReporter ) ;
2019-10-27 15:52:50 +01:00
image . m_imageData = decoder . decode ( maskingType ) ;
2019-11-03 14:56:56 +01:00
image . m_imageData . setDecode ( ! decode . empty ( ) ? qMove ( decode ) : std : : vector < PDFReal > ( { 0.0 , 1.0 } ) ) ;
2019-06-15 14:29:49 +02:00
}
2019-10-05 15:11:53 +02:00
else if ( colorSpace | | isSoftMask )
2019-06-15 14:29:49 +02:00
{
// We treat data as binary maybe compressed stream (for example by Flate/LZW method), but data can also be not compressed.
const unsigned int components = static_cast < unsigned int > ( colorSpace - > getColorComponentCount ( ) ) ;
const unsigned int bitsPerComponent = static_cast < unsigned int > ( loader . readIntegerFromDictionary ( dictionary , " BitsPerComponent " , 8 ) ) ;
const unsigned int width = static_cast < unsigned int > ( loader . readIntegerFromDictionary ( dictionary , " Width " , 0 ) ) ;
const unsigned int height = static_cast < unsigned int > ( loader . readIntegerFromDictionary ( dictionary , " Height " , 0 ) ) ;
if ( bitsPerComponent < 1 | | bitsPerComponent > 32 )
{
throw PDFRendererException ( RenderErrorType : : Error , PDFTranslationContext : : tr ( " Invalid number of bits per component (%1) . " ).arg(bitsPerComponent)) ;
}
if ( width = = 0 | | height = = 0 )
{
throw PDFRendererException ( RenderErrorType : : Error , PDFTranslationContext : : tr ( " Invalid size of image (%1x%2) " ).arg(width).arg(height)) ;
}
// Calculate stride
const unsigned int stride = ( components * bitsPerComponent * width + 7 ) / 8 ;
QByteArray imageDataBuffer = document - > getDecodedStream ( stream ) ;
2019-10-05 15:11:53 +02:00
image . m_imageData = PDFImageData ( components , bitsPerComponent , width , height , stride , maskingType , qMove ( imageDataBuffer ) , qMove ( mask ) , qMove ( decode ) , qMove ( matte ) ) ;
2019-06-15 17:40:22 +02:00
}
else if ( imageMask )
{
2020-08-15 15:57:55 +02:00
// If ImageMask is set to true, then "BitsPerComponent" should have always value of 1.
// If this entry is not specified, then the value should be implicitly 1.
const unsigned int bitsPerComponent = static_cast < unsigned int > ( loader . readIntegerFromDictionary ( dictionary , " BitsPerComponent " , 1 ) ) ;
2019-06-15 17:40:22 +02:00
if ( bitsPerComponent ! = 1 )
{
throw PDFRendererException ( RenderErrorType : : Error , PDFTranslationContext : : tr ( " Invalid number bits of image mask (should be 1 bit instead of %1 bits) . " ).arg(bitsPerComponent)) ;
}
const unsigned int width = static_cast < unsigned int > ( loader . readIntegerFromDictionary ( dictionary , " Width " , 0 ) ) ;
const unsigned int height = static_cast < unsigned int > ( loader . readIntegerFromDictionary ( dictionary , " Height " , 0 ) ) ;
if ( width = = 0 | | height = = 0 )
{
throw PDFRendererException ( RenderErrorType : : Error , PDFTranslationContext : : tr ( " Invalid size of image (%1x%2) " ).arg(width).arg(height)) ;
}
// Calculate stride
const unsigned int stride = ( width + 7 ) / 8 ;
QByteArray imageDataBuffer = document - > getDecodedStream ( stream ) ;
2019-10-05 15:11:53 +02:00
image . m_imageData = PDFImageData ( 1 , bitsPerComponent , width , height , stride , maskingType , qMove ( imageDataBuffer ) , qMove ( mask ) , qMove ( decode ) , qMove ( matte ) ) ;
2019-06-15 14:29:49 +02:00
}
2019-05-07 18:21:22 +02:00
return image ;
}
2019-12-25 17:56:17 +01:00
QImage PDFImage : : getImage ( const PDFCMS * cms , PDFRenderErrorReporter * reporter ) const
2019-05-07 18:21:22 +02:00
{
2019-07-24 19:15:03 +02:00
const bool isImageMask = m_imageData . getMaskingType ( ) = = PDFImageData : : MaskingType : : ImageMask ;
if ( m_colorSpace & & ! isImageMask )
2019-05-07 18:21:22 +02:00
{
2019-12-25 17:56:17 +01:00
return m_colorSpace - > getImage ( m_imageData , m_softMask , cms , m_renderingIntent , reporter ) ;
2019-05-07 18:21:22 +02:00
}
2019-07-24 19:15:03 +02:00
else if ( isImageMask )
2019-06-15 17:40:22 +02:00
{
if ( m_imageData . getBitsPerComponent ( ) ! = 1 )
{
throw PDFRendererException ( RenderErrorType : : Error , PDFTranslationContext : : tr ( " Invalid number bits of image mask (should be 1 bit instead of %1 bits) . " ).arg(m_imageData.getBitsPerComponent())) ;
}
if ( m_imageData . getWidth ( ) = = 0 | | m_imageData . getHeight ( ) = = 0 )
{
throw PDFRendererException ( RenderErrorType : : Error , PDFTranslationContext : : tr ( " Invalid size of image (%1x%2) " ).arg(m_imageData.getWidth()).arg(m_imageData.getHeight())) ;
}
QImage image ( m_imageData . getWidth ( ) , m_imageData . getHeight ( ) , QImage : : Format_Alpha8 ) ;
const bool flip01 = ! m_imageData . getDecode ( ) . empty ( ) & & qFuzzyCompare ( m_imageData . getDecode ( ) . front ( ) , 1.0 ) ;
2019-09-15 16:50:34 +02:00
PDFBitReader reader ( & m_imageData . getData ( ) , m_imageData . getBitsPerComponent ( ) ) ;
2019-06-15 17:40:22 +02:00
for ( unsigned int i = 0 , rowCount = m_imageData . getHeight ( ) ; i < rowCount ; + + i )
{
reader . seek ( i * m_imageData . getStride ( ) ) ;
unsigned char * outputLine = image . scanLine ( i ) ;
for ( unsigned int j = 0 ; j < m_imageData . getWidth ( ) ; + + j )
{
const bool transparent = flip01 ! = static_cast < bool > ( reader . read ( ) ) ;
* outputLine + + = transparent ? 0x00 : 0xFF ;
}
}
return image ;
}
2019-05-07 18:21:22 +02:00
return QImage ( ) ;
}
OPJ_SIZE_T PDFJPEG2000ImageData : : read ( void * p_buffer , OPJ_SIZE_T p_nb_bytes , void * p_user_data )
{
PDFJPEG2000ImageData * data = reinterpret_cast < PDFJPEG2000ImageData * > ( p_user_data ) ;
// Remaining length
OPJ_OFF_T length = static_cast < OPJ_OFF_T > ( data - > byteArray - > size ( ) ) - data - > position ;
if ( length < 0 )
{
length = 0 ;
}
if ( length > static_cast < OPJ_OFF_T > ( p_nb_bytes ) )
{
length = static_cast < OPJ_OFF_T > ( p_nb_bytes ) ;
}
if ( length > 0 )
{
std : : memcpy ( p_buffer , data - > byteArray - > constData ( ) + data - > position , length ) ;
data - > position + = length ;
}
2019-05-10 19:48:52 +02:00
if ( length = = 0 )
{
return ( OPJ_SIZE_T ) - 1 ;
}
2019-05-07 18:21:22 +02:00
return length ;
}
OPJ_BOOL PDFJPEG2000ImageData : : seek ( OPJ_OFF_T p_nb_bytes , void * p_user_data )
{
PDFJPEG2000ImageData * data = reinterpret_cast < PDFJPEG2000ImageData * > ( p_user_data ) ;
if ( p_nb_bytes > = data - > byteArray - > size ( ) )
{
return OPJ_FALSE ;
}
data - > position = p_nb_bytes ;
return OPJ_TRUE ;
}
OPJ_OFF_T PDFJPEG2000ImageData : : skip ( OPJ_OFF_T p_nb_bytes , void * p_user_data )
{
PDFJPEG2000ImageData * data = reinterpret_cast < PDFJPEG2000ImageData * > ( p_user_data ) ;
// Remaining length
OPJ_OFF_T length = static_cast < OPJ_OFF_T > ( data - > byteArray - > size ( ) ) - data - > position ;
if ( length < 0 )
{
length = 0 ;
}
if ( length > static_cast < OPJ_OFF_T > ( p_nb_bytes ) )
{
length = static_cast < OPJ_OFF_T > ( p_nb_bytes ) ;
}
data - > position + = length ;
return length ;
}
2020-08-15 15:57:55 +02:00
PDFAlternateImage PDFAlternateImage : : parse ( const PDFObjectStorage * storage , PDFObject object )
{
PDFAlternateImage result ;
if ( const PDFDictionary * dictionary = storage - > getDictionaryFromObject ( object ) )
{
PDFDocumentDataLoaderDecorator loader ( storage ) ;
result . m_image = loader . readReferenceFromDictionary ( dictionary , " Image " ) ;
result . m_oc = loader . readReferenceFromDictionary ( dictionary , " OC " ) ;
result . m_defaultForPrinting = loader . readBooleanFromDictionary ( dictionary , " DefaultForPrinting " , false ) ;
}
return result ;
}
2019-10-12 18:10:25 +02:00
2019-05-07 18:21:22 +02:00
} // namespace pdf