pdfio/pdfio-object.c
Michael R Sweet 18853ca3d5
Increase token buffer to 256 bytes, to avoid overflow scenarios.
Add _pdfioTokenFlush to manually flush the token buffer.

Add more debug printfs.
2021-05-10 17:37:57 -04:00

262 lines
5.8 KiB
C
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

//
// PDF object functions for pdfio.
//
// Copyright © 2021 by Michael R Sweet.
//
// Licensed under Apache License v2.0. See the file "LICENSE" for more
// information.
//
//
// Include necessary headers...
//
#include "pdfio-private.h"
//
// 'pdfioObjClose()' - Close an object, writing any data as needed to the PDF
// file.
//
bool // O - `true` on success, `false` on failure
pdfioObjClose(pdfio_obj_t *obj) // I - Object
{
// TODO: Implement me
(void)obj;
return (false);
}
//
// 'pdfioObjCreateStream()' - Create an object (data) stream for writing.
//
pdfio_stream_t * // O - Stream or `NULL` on error
pdfioObjCreateStream(
pdfio_obj_t *obj, // I - Object
pdfio_filter_t filter) // I - Type of compression to apply
{
// TODO: Implement me
(void)obj;
(void)filter;
return (NULL);
}
//
// '_pdfioObjDelete()' - Free memory used by an object.
//
void
_pdfioObjDelete(pdfio_obj_t *obj) // I - Object
{
if (obj)
pdfioStreamClose(obj->stream);
free(obj);
}
//
// 'pdfioObjGetDict()' - Get the dictionary associated with an object.
//
pdfio_dict_t * // O - Dictionary or `NULL` on error
pdfioObjGetDict(pdfio_obj_t *obj) // I - Object
{
if (!obj)
return (NULL);
if (obj->value.type == PDFIO_VALTYPE_NONE)
_pdfioObjLoad(obj);
if (obj->value.type == PDFIO_VALTYPE_DICT)
return (obj->value.value.dict);
else
return (NULL);
}
//
// 'pdfioObjGetGeneration()' - Get the object's generation number.
//
unsigned short // O - Generation number (0 to 65535)
pdfioObjGetGeneration(pdfio_obj_t *obj) // I - Object
{
return (obj ? obj->generation : 0);
}
//
// 'pdfioObjGetLength()' - Get the length of the object's (data) stream.
//
size_t // O - Length in bytes or `0` for none
pdfioObjGetLength(pdfio_obj_t *obj) // I - Object
{
size_t length; // Length of stream
pdfio_obj_t *lenobj; // Length object
// Range check input...
if (!obj || !obj->stream_offset || obj->value.type != PDFIO_VALTYPE_DICT)
return (0);
// Try getting the length, directly or indirectly
if ((length = (size_t)pdfioDictGetNumber(obj->value.value.dict, "Length")) > 0)
return (length);
if ((lenobj = pdfioDictGetObject(obj->value.value.dict, "Length")) == NULL)
{
_pdfioFileError(obj->pdf, "Unable to get length of stream.");
return (0);
}
if (lenobj->value.type == PDFIO_VALTYPE_NONE)
_pdfioObjLoad(lenobj);
if (lenobj->value.type != PDFIO_VALTYPE_NUMBER || lenobj->value.value.number <= 0.0f)
{
_pdfioFileError(obj->pdf, "Unable to get length of stream.");
return (0);
}
return ((size_t)lenobj->value.value.number);
}
//
// 'pdfioObjGetNumber()' - Get the object's number.
//
size_t // O - Object number (1 to 9999999999)
pdfioObjGetNumber(pdfio_obj_t *obj) // I - Object
{
return (obj ? obj->number : 0);
}
//
// 'pdfioObjGetType()' - Get an object's type.
//
const char * // O - Object type
pdfioObjGetType(pdfio_obj_t *obj) // I - Object
{
pdfio_dict_t *dict; // Object dictionary
if ((dict = pdfioObjGetDict(obj)) == NULL)
return (NULL);
else
return (pdfioDictGetName(dict, "Type"));
}
//
// '_pdfioObjLoad()' - Load an object dictionary/value.
//
bool // O - `true` on success, `false` otherwise
_pdfioObjLoad(pdfio_obj_t *obj) // I - Object
{
char line[1024], // Line from file
*ptr; // Pointer into line
_pdfio_token_t tb; // Token buffer/stack
PDFIO_DEBUG("_pdfioObjLoad(obj=%p(%lu)), offset=%lu\n", obj, (unsigned long)obj->number, (unsigned long)obj->offset);
// Seek to the start of the object and read its header...
if (_pdfioFileSeek(obj->pdf, obj->offset, SEEK_SET) != obj->offset)
{
_pdfioFileError(obj->pdf, "Unable to seek to object %lu.", (unsigned long)obj->number);
return (false);
}
if (!_pdfioFileGets(obj->pdf, line, sizeof(line)))
{
_pdfioFileError(obj->pdf, "Unable to read header for object %lu.", (unsigned long)obj->number);
return (false);
}
if (strtoimax(line, &ptr, 10) != (intmax_t)obj->number)
{
_pdfioFileError(obj->pdf, "Bad header for object %lu.", (unsigned long)obj->number);
return (false);
}
if (strtol(ptr, &ptr, 10) != (long)obj->generation)
{
_pdfioFileError(obj->pdf, "Bad header for object %lu.", (unsigned long)obj->number);
return (false);
}
while (isspace(*ptr & 255))
ptr ++;
if (strcmp(ptr, "obj"))
{
_pdfioFileError(obj->pdf, "Bad header for object %lu.", (unsigned long)obj->number);
return (false);
}
// Then grab the object value...
_pdfioTokenInit(&tb, obj->pdf, (_pdfio_tconsume_cb_t)_pdfioFileConsume, (_pdfio_tpeek_cb_t)_pdfioFilePeek, obj->pdf);
if (!_pdfioValueRead(obj->pdf, &tb, &obj->value))
{
_pdfioFileError(obj->pdf, "Unable to read value for object %lu.", (unsigned long)obj->number);
return (false);
}
// Now see if there is an associated stream...
if (!_pdfioTokenGet(&tb, line, sizeof(line)))
{
_pdfioFileError(obj->pdf, "Early end-of-file for object %lu.", (unsigned long)obj->number);
return (false);
}
_pdfioTokenFlush(&tb);
if (!strcmp(line, "stream"))
{
// Yes, save its location...
obj->stream_offset = _pdfioFileTell(obj->pdf);
}
return (true);
}
//
// 'pdfioObjOpenStream()' - Open an object's (data) stream for reading.
//
pdfio_stream_t * // O - Stream or `NULL` on error
pdfioObjOpenStream(pdfio_obj_t *obj, // I - Object
bool decode) // I - Decode/decompress data?
{
// Range check input...
if (!obj)
return (NULL);
// Make sure we've loaded the object dictionary...
if (!obj->value.type)
{
if (!_pdfioObjLoad(obj))
return (NULL);
}
// No stream if there is no dict or offset to a stream...
if (obj->value.type != PDFIO_VALTYPE_DICT || !obj->stream_offset)
return (NULL);
// Open the stream...
return (_pdfioStreamOpen(obj, decode));
}