Finalize md2pdf example docos.

This commit is contained in:
Michael R Sweet 2024-12-22 12:09:03 -05:00
parent 5dc68f3285
commit aa91b141a8
No known key found for this signature in database
GPG Key ID: BE67C75EC81F3244
4 changed files with 1948 additions and 649 deletions

View File

@ -1,9 +1,9 @@
.TH pdfio 3 "pdf read/write library" "2024-12-19" "pdf read/write library" .TH pdfio 3 "pdf read/write library" "2024-12-22" "pdf read/write library"
.SH NAME .SH NAME
pdfio \- pdf read/write library pdfio \- pdf read/write library
.SH Introduction .SH Introduction
.PP .PP
PDFio is a simple C library for reading and writing PDF files. The primary goals of pdfio are: PDFio is a simple C library for reading and writing PDF files. The primary goals of PDFio are:
.IP \(bu 5 .IP \(bu 5
.PP .PP
Read and write any version of PDF file Read and write any version of PDF file
@ -305,8 +305,8 @@ You open an existing PDF file using the pdfioFileOpen function:
.nf .nf
pdfio_file_t *pdf = pdfio_file_t *pdf =
pdfioFileOpen("myinputfile.pdf", password_cb, password_data, pdfioFileOpen("myinputfile.pdf", password_cb, password_data, error_cb,
error_cb, error_data); error_data);
.fi .fi
.PP .PP
where the five arguments to the function are the filename ("myinputfile.pdf"), an optional password callback function (password_cb) and data pointer value (password_data), and an optional error callback function (error_cb) and data pointer value (error_data). The password callback is called for encrypted PDF files that are not using the default password, for example: where the five arguments to the function are the filename ("myinputfile.pdf"), an optional password callback function (password_cb) and data pointer value (password_data), and an optional error callback function (error_cb) and data pointer value (error_data). The password callback is called for encrypted PDF files that are not using the default password, for example:
@ -454,8 +454,7 @@ You create a new PDF file using the pdfioFileCreate function:
pdfio_rect_t media_box = { 0.0, 0.0, 612.0, 792.0 }; // US Letter pdfio_rect_t media_box = { 0.0, 0.0, 612.0, 792.0 }; // US Letter
pdfio_rect_t crop_box = { 36.0, 36.0, 576.0, 756.0 }; // w/0.5" margins pdfio_rect_t crop_box = { 36.0, 36.0, 576.0, 756.0 }; // w/0.5" margins
pdfio_file_t *pdf = pdfioFileCreate("myoutputfile.pdf", "2.0", pdfio_file_t *pdf = pdfioFileCreate("myoutputfile.pdf", "2.0", &media_box, &crop_box,
&media_box, &crop_box,
error_cb, error_data); error_cb, error_data);
.fi .fi
.PP .PP
@ -467,9 +466,8 @@ Alternately you can stream a PDF file using the pdfioFileCreateOutput function:
pdfio_rect_t media_box = { 0.0, 0.0, 612.0, 792.0 }; // US Letter pdfio_rect_t media_box = { 0.0, 0.0, 612.0, 792.0 }; // US Letter
pdfio_rect_t crop_box = { 36.0, 36.0, 576.0, 756.0 }; // w/0.5" margins pdfio_rect_t crop_box = { 36.0, 36.0, 576.0, 756.0 }; // w/0.5" margins
pdfio_file_t *pdf = pdfioFileCreateOutput(output_cb, output_ctx, "2.0", pdfio_file_t *pdf = pdfioFileCreateOutput(output_cb, output_ctx, "2.0", &media_box,
&media_box, &crop_box, &crop_box, error_cb, error_data);
error_cb, error_data);
.fi .fi
.PP .PP
Once the file is created, use the pdfioFileCreateObj, pdfioFileCreatePage, and pdfioPageCopy functions to create objects and pages in the file. Once the file is created, use the pdfioFileCreateObj, pdfioFileCreatePage, and pdfioPageCopy functions to create objects and pages in the file.
@ -756,10 +754,9 @@ PDF supports images with many different color spaces and bit depths with optiona
pdfio_file_t *pdf = pdfioFileCreate(...); pdfio_file_t *pdf = pdfioFileCreate(...);
unsigned char data[1024 * 1024 * 4]; // 1024x1024 RGBA image data unsigned char data[1024 * 1024 * 4]; // 1024x1024 RGBA image data
pdfio_obj_t *img = pdfio_obj_t *img =
pdfioFileCreateImageObjFromData(pdf, data, /*width*/1024, pdfioFileCreateImageObjFromData(pdf, data, /*width*/1024, /*height*/1024,
/*height*/1024, /*num_colors*/3, /*num_colors*/3, /*color_data*/NULL,
/*color_data*/NULL, /*alpha*/true, /*alpha*/true, /*interpolate*/false);
/*interpolate*/false);
.fi .fi
.PP .PP
will create an object for a 1024x1024 RGBA image in memory, using the default color space for 3 colors ("DeviceRGB"). We can use one of the color space functions to use a specific color space for this image, for example: will create an object for a 1024x1024 RGBA image in memory, using the default color space for 3 colors ("DeviceRGB"). We can use one of the color space functions to use a specific color space for this image, for example:
@ -770,17 +767,14 @@ will create an object for a 1024x1024 RGBA image in memory, using the default co
// Create an AdobeRGB color array // Create an AdobeRGB color array
pdfio_array_t *adobe_rgb = pdfio_array_t *adobe_rgb =
pdfioArrayCreateColorFromMatrix(pdf, 3, pdfioAdobeRGBGamma, pdfioArrayCreateColorFromMatrix(pdf, 3, pdfioAdobeRGBGamma,
pdfioAdobeRGBMatrix, pdfioAdobeRGBMatrix, pdfioAdobeRGBWhitePoint);
pdfioAdobeRGBWhitePoint);
// Create a 1024x1024 RGBA image using AdobeRGB // Create a 1024x1024 RGBA image using AdobeRGB
unsigned char data[1024 * 1024 * 4]; // 1024x1024 RGBA image data unsigned char data[1024 * 1024 * 4]; // 1024x1024 RGBA image data
pdfio_obj_t *img = pdfio_obj_t *img =
pdfioFileCreateImageObjFromData(pdf, data, /*width*/1024, pdfioFileCreateImageObjFromData(pdf, data, /*width*/1024, /*height*/1024,
/*height*/1024, /*num_colors*/3, /*num_colors*/3, /*color_data*/adobe_rgb,
/*color_data*/adobe_rgb, /*alpha*/true, /*interpolate*/false);
/*alpha*/true,
/*interpolate*/false);
.fi .fi
.PP .PP
The "interpolate" argument specifies whether the colors in the image should be smoothed/interpolated when scaling. This is most useful for photographs but should be false for screenshot and barcode images. The "interpolate" argument specifies whether the colors in the image should be smoothed/interpolated when scaling. This is most useful for photographs but should be false for screenshot and barcode images.
@ -790,8 +784,7 @@ If you have a JPEG or PNG file, use the pdfioFileCreateImageObjFromFile function
pdfio_file_t *pdf = pdfioFileCreate(...); pdfio_file_t *pdf = pdfioFileCreate(...);
pdfio_obj_t *img = pdfio_obj_t *img =
pdfioFileCreateImageObjFromFile(pdf, "myphoto.jpg", pdfioFileCreateImageObjFromFile(pdf, "myphoto.jpg", /*interpolate*/true);
/*interpolate*/true);
.fi .fi
.PP .PP
Note: Currently pdfioFileCreateImageObjFromFile does not support 12 bit JPEG files or PNG files with an alpha channel. Note: Currently pdfioFileCreateImageObjFromFile does not support 12 bit JPEG files or PNG files with an alpha channel.
@ -1065,9 +1058,8 @@ The pdfioinfo.c example program opens a PDF file and prints the title, author, c
filename = argv[1]; filename = argv[1];
// Open the PDF file with the default callbacks... // Open the PDF file with the default callbacks...
pdf = pdfioFileOpen(filename, /*password_cb*/NULL, pdf = pdfioFileOpen(filename, /*password_cb*/NULL, /*password_cbdata*/NULL,
/*password_cbdata*/NULL, /*error_cb*/NULL, /*error_cb*/NULL, /*error_cbdata*/NULL);
/*error_cbdata*/NULL);
if (pdf == NULL) if (pdf == NULL)
return (1); return (1);
@ -1116,9 +1108,8 @@ The image2pdf.c example code creates a PDF file containing a JPEG or PNG image f
// Create the PDF file... // Create the PDF file...
pdf = pdfioFileCreate(pdfname, /*version*/NULL, /*media_box*/NULL, pdf = pdfioFileCreate(pdfname, /*version*/NULL, /*media_box*/NULL, /*crop_box*/NULL,
/*crop_box*/NULL, /*error_cb*/NULL, /*error_cb*/NULL, /*error_cbdata*/NULL);
/*error_cbdata*/NULL);
if (!pdf) if (!pdf)
return (false); return (false);
@ -1152,9 +1143,9 @@ The image2pdf.c example code creates a PDF file containing a JPEG or PNG image f
width = pdfioImageGetWidth(image); width = pdfioImageGetWidth(image);
height = pdfioImageGetHeight(image); height = pdfioImageGetHeight(image);
// Default media_box is "universal" 595.28x792 points (8.27x11in or // Default media_box is "universal" 595.28x792 points (8.27x11in or 210x279mm).
// 210x279mm). Use margins of 36 points (0.5in or 12.7mm) with another // Use margins of 36 points (0.5in or 12.7mm) with another 36 points for the
// 36 points for the caption underneath... // caption underneath...
swidth = 595.28 \- 72.0; swidth = 595.28 \- 72.0;
sheight = swidth * height / width; sheight = swidth * height / width;
if (sheight > (792.0 \- 36.0 \- 72.0)) if (sheight > (792.0 \- 36.0 \- 72.0))
@ -1171,8 +1162,8 @@ The image2pdf.c example code creates a PDF file containing a JPEG or PNG image f
// Draw the caption in black... // Draw the caption in black...
pdfioContentSetFillColorDeviceGray(page, 0.0); pdfioContentSetFillColorDeviceGray(page, 0.0);
// Compute the starting point for the text \- Courier is monospaced // Compute the starting point for the text \- Courier is monospaced with a
// with a nominal width of 0.6 times the text height... // nominal width of 0.6 times the text height...
tx = 0.5 * (595.28 \- 18.0 * 0.6 * strlen(caption)); tx = 0.5 * (595.28 \- 18.0 * 0.6 * strlen(caption));
// Position and draw the caption underneath... // Position and draw the caption underneath...
@ -1247,8 +1238,7 @@ The first thing you need to do is prepare the barcode string to use with the fon
The main function does the rest of the work. The barcode font is imported using the pdfioFileCreateFontObjFromFile function. We pass false for the "unicode" argument since we just want the (default) ASCII encoding: The main function does the rest of the work. The barcode font is imported using the pdfioFileCreateFontObjFromFile function. We pass false for the "unicode" argument since we just want the (default) ASCII encoding:
.nf .nf
barcode_font = pdfioFileCreateFontObjFromFile(pdf, "code128.ttf", barcode_font = pdfioFileCreateFontObjFromFile(pdf, "code128.ttf", /*unicode*/false);
/*unicode*/false);
.fi .fi
.PP .PP
Since barcodes usually have the number or text represented by the barcode printed underneath it, we also need a regular text font, for which we can choose one of the standard 14 PostScript base fonts using the pdfioFileCreateFontObjFromBase function: Since barcodes usually have the number or text represented by the barcode printed underneath it, we also need a regular text font, for which we can choose one of the standard 14 PostScript base fonts using the pdfioFileCreateFontObjFromBase function:
@ -1278,8 +1268,7 @@ Once we have these fonts we can measure the barcode and regular text labels usin
if (text && text_font) if (text && text_font)
{ {
text_height = 9.0; text_height = 9.0;
text_width = pdfioContentTextMeasure(text_font, text, text_width = pdfioContentTextMeasure(text_font, text, text_height);
text_height);
} }
// Compute the size of the PDF page... // Compute the size of the PDF page...
@ -1287,8 +1276,7 @@ Once we have these fonts we can measure the barcode and regular text labels usin
media_box.x1 = 0.0; media_box.x1 = 0.0;
media_box.y1 = 0.0; media_box.y1 = 0.0;
media_box.x2 = (barcode_width > text_width ? media_box.x2 = (barcode_width > text_width ? barcode_width : text_width) + 18.0;
barcode_width : text_width) + 18.0;
media_box.y2 = barcode_height + text_height + 18.0; media_box.y2 = barcode_height + text_height + 18.0;
.fi .fi
.PP .PP
@ -1336,8 +1324,789 @@ With the barcode font called "B128" and the text font called "TEXT", we can use
.PP .PP
Markdown is a simple plain text format that supports things like headings, links, character styles, tables, and embedded images. The md2pdf.c example code uses the mmd library to convert markdown to a PDF file that can be distributed. Markdown is a simple plain text format that supports things like headings, links, character styles, tables, and embedded images. The md2pdf.c example code uses the mmd library to convert markdown to a PDF file that can be distributed.
.PP .PP
Note: The md2pdf example is by far the most complex example code included with PDFio and shows how to lay out text, add headers and footers, add links, embed images, and format tables. Note: The md2pdf example is by far the most complex example code included with PDFio and shows how to lay out text, add headers and footers, add links, embed images, format tables, and add an outline (table of contents) for navigation.
.PP
Managing Document State
.PP
The md2pdf program needs to maintain three sets of state \- one for the markdown document which is represented by nodes of type mmd_t and the others for the PDF document and current PDF page which are contained in the docdata_t structure:
.nf
typedef struct docdata_s // Document formatting data
{
// State for the whole document
pdfio_file_t *pdf; // PDF file
pdfio_rect_t media_box; // Media (page) box
pdfio_rect_t crop_box; // Crop box (for margins)
pdfio_rect_t art_box; // Art box (for markdown content)
pdfio_obj_t *fonts[DOCFONT_MAX]; // Embedded fonts
double font_space; // Unit width of a space
size_t num_images; // Number of embedded images
docimage_t images[DOCIMAGE_MAX]; // Embedded images
const char *title; // Document title
char *heading; // Current document heading
size_t num_actions; // Number of actions for this document
docaction_t actions[DOCACTION_MAX]; // Actions for this document
size_t num_targets; // Number of targets for this document
doctarget_t targets[DOCTARGET_MAX]; // Targets for this document
size_t num_toc; // Number of table\-of\-contents entries
doctoc_t toc[DOCTOC_MAX]; // Table\-of\-contents entries
// State for the current page
pdfio_stream_t *st; // Current page stream
double y; // Current position on page
docfont_t font; // Current font
double fsize; // Current font size
doccolor_t color; // Current color
pdfio_array_t *annots_array; // Annotations array (for links)
pdfio_obj_t *annots_obj; // Annotations object (for links)
size_t num_links; // Number of links for this page
doclink_t links[DOCLINK_MAX]; // Links for this page
} docdata_t;
.fi
.PP
Document State
.PP
The output is fixed to the "universal" media size (the intersection of US Letter and ISO A4) with 1/2 inch margins \- the PAGE_ constants can be changed to select a different size or margins. The media_box member contains the "MediaBox" rectangle for the PDF pages, while the crop_box and art_box members contain the "CropBox" and "ArtBox" values, respectively.
.PP
Four embedded fonts are used:
.IP \(bu 5
.PP
DOCFONT_REGULAR: the default font used for text,
.IP \(bu 5
.PP
DOCFONT_BOLD: a boldface font used for headings and strong text,
.IP \(bu 5
.PP
DOCFONT_ITALIC: an italic/oblique font used for emphasized text, and
.IP \(bu 5
.PP
DOCFONT_MONOSPACE: a fixed\-width font used for code.
.PP
By default the code uses the base PostScript fonts Helvetica, Helvetica\-Bold, Helvetica\-Oblique, and Courier. The USE_TRUETYPE define can be used to replace these with the Roboto TrueType fonts.
.PP
Embedded JPEG and PNG images are copied into the PDF document, with the images array containing the list of the images and their objects.
.PP
The title member contains the document title, while the heading member contains the current heading text.
.PP
The actions array contains a list of action dictionaries for interior document links that need to be resolved, while the targets array keeps track of the location of the headings in the PDF document.
.PP
The toc array contains a list of headings and is used to construct the PDF outlines dictionaries/objects, which provide a table of contents for navigation in most PDF readers.
.PP
Page State
.PP
The st member provides the stream for the current page content. The color, font, fsize, and y members provide the current graphics state on the page.
.PP
The annots_array, annots_obj, num_links, and links members contain a list of hyperlinks on the current page.
.PP
Creating Pages
.PP
The new_page function is used to start a new page. Aside from creating the new page object and stream, it adds a standard header and footer to the page. It starts by closing the current page if it is open:
.nf
// Close the current page...
if (dd\->st)
{
pdfioStreamClose(dd\->st);
add_links(dd);
}
.fi
.PP
The new page needs a dictionary containing any link annotations, the media and art boxes, the four fonts, and any images:
.nf
// Prep the new page...
page_dict = pdfioDictCreate(dd\->pdf);
dd\->annots_array = pdfioArrayCreate(dd\->pdf);
dd\->annots_obj = pdfioFileCreateArrayObj(dd\->pdf, dd\->annots_array);
pdfioDictSetObj(page_dict, "Annots", dd\->annots_obj);
pdfioDictSetRect(page_dict, "MediaBox", &dd\->media_box);
pdfioDictSetRect(page_dict, "ArtBox", &dd\->art_box);
for (fontface = DOCFONT_REGULAR; fontface < DOCFONT_MAX; fontface ++)
pdfioPageDictAddFont(page_dict, docfont_names[fontface], dd\->fonts[fontface]);
for (i = 0; i < dd\->num_images; i ++)
pdfioPageDictAddImage(page_dict, pdfioStringCreatef(dd\->pdf, "I%u", (unsigned)i),
dd\->images[i].obj);
.fi
.PP
Once the page dictionary is initialized, we create a new page and initialize the current graphics state:
.nf
dd\->st = pdfioFileCreatePage(dd\->pdf, page_dict);
dd\->color = DOCCOLOR_BLACK;
dd\->font = DOCFONT_MAX;
dd\->fsize = 0.0;
dd\->y = dd\->art_box.y2;
.fi
.PP
The header consists of a dark gray separating line and the document title. We don't show the header on the first page:
.nf
// Add header/footer text
set_color(dd, DOCCOLOR_GRAY);
set_font(dd, DOCFONT_REGULAR, SIZE_HEADFOOT);
if (pdfioFileGetNumPages(dd\->pdf) > 1 && dd\->title)
{
// Show title in header...
width = pdfioContentTextMeasure(dd\->fonts[DOCFONT_REGULAR], dd\->title,
SIZE_HEADFOOT);
pdfioContentTextBegin(dd\->st);
pdfioContentTextMoveTo(dd\->st,
dd\->crop_box.x1 + 0.5 * (dd\->crop_box.x2 \-
dd\->crop_box.x1 \- width),
dd\->crop_box.y2 \- SIZE_HEADFOOT);
pdfioContentTextShow(dd\->st, UNICODE_VALUE, dd\->title);
pdfioContentTextEnd(dd\->st);
pdfioContentPathMoveTo(dd\->st, dd\->crop_box.x1,
dd\->crop_box.y2 \- 2 * SIZE_HEADFOOT * LINE_HEIGHT +
SIZE_HEADFOOT);
pdfioContentPathLineTo(dd\->st, dd\->crop_box.x2,
dd\->crop_box.y2 \- 2 * SIZE_HEADFOOT * LINE_HEIGHT +
SIZE_HEADFOOT);
pdfioContentStroke(dd\->st);
}
.fi
.PP
The footer contains the same dark gray separating line with the current heading and page number on opposite sides. The page number is always positioned on the outer edge for a two\-sided print \- right justified on odd numbered pages and left justified on even numbered pages:
.nf
// Show page number and current heading...
pdfioContentPathMoveTo(dd\->st, dd\->crop_box.x1,
dd\->crop_box.y1 + SIZE_HEADFOOT * LINE_HEIGHT);
pdfioContentPathLineTo(dd\->st, dd\->crop_box.x2,
dd\->crop_box.y1 + SIZE_HEADFOOT * LINE_HEIGHT);
pdfioContentStroke(dd\->st);
pdfioContentTextBegin(dd\->st);
snprintf(temp, sizeof(temp), "%u", (unsigned)pdfioFileGetNumPages(dd\->pdf));
if (pdfioFileGetNumPages(dd\->pdf) & 1)
{
// Page number on right...
width = pdfioContentTextMeasure(dd\->fonts[DOCFONT_REGULAR], temp, SIZE_HEADFOOT);
pdfioContentTextMoveTo(dd\->st, dd\->crop_box.x2 \- width, dd\->crop_box.y1);
}
else
{
// Page number on left...
pdfioContentTextMoveTo(dd\->st, dd\->crop_box.x1, dd\->crop_box.y1);
}
pdfioContentTextShow(dd\->st, UNICODE_VALUE, temp);
pdfioContentTextEnd(dd\->st);
if (dd\->heading)
{
pdfioContentTextBegin(dd\->st);
if (pdfioFileGetNumPages(dd\->pdf) & 1)
{
// Current heading on left...
pdfioContentTextMoveTo(dd\->st, dd\->crop_box.x1, dd\->crop_box.y1);
}
else
{
width = pdfioContentTextMeasure(dd\->fonts[DOCFONT_REGULAR], dd\->heading,
SIZE_HEADFOOT);
pdfioContentTextMoveTo(dd\->st, dd\->crop_box.x2 \- width, dd\->crop_box.y1);
}
pdfioContentTextShow(dd\->st, UNICODE_VALUE, dd\->heading);
pdfioContentTextEnd(dd\->st);
}
.fi
.PP
Formatting the Markdown Document
.PP
Four functions handle the formatting of the markdown document:
.IP \(bu 5
.PP
format_block: formats a single paragraph, heading, or table cell,
.IP \(bu 5
.PP
format_code: formats a block of code,
.IP \(bu 5
.PP
format_doc: formats the document as a whole, and
.IP \(bu 5
.PP
format_table: formats a table.
.PP
Formatted content is organized into arrays of linefrag_t and tablerow_t structures for a line of content or row of table cells, respectively.
.PP
High\-Level Formatting
.PP
The format_doc function iterates over the block nodes in the markdown document. We map a "thematic break" (horizontal rule) to a page break, which is implemented by moving the current vertical position to the bottom of the page:
.nf
case MMD_TYPE_THEMATIC_BREAK :
// Force a page break
dd\->y = dd\->art_box.y1;
break;
.fi
.PP
A block quote is indented and uses the italic font by default:
.nf
case MMD_TYPE_BLOCK_QUOTE :
format_doc(dd, current, DOCFONT_ITALIC, left + BQ_PADDING, right \- BQ_PADDING);
break;
.fi
.PP
Lists have a leading blank line and are indented:
.nf
case MMD_TYPE_ORDERED_LIST :
case MMD_TYPE_UNORDERED_LIST :
if (dd\->st)
dd\->y \-= SIZE_BODY * LINE_HEIGHT;
format_doc(dd, current, deffont, left + LIST_PADDING, right);
break;
.fi
.PP
List items do not have a leading blank line and make use of leader text that is shown in front of the list text. The leader text is either the current item number or a bullet, which then is directly formatted using the format_block function:
.nf
case MMD_TYPE_LIST_ITEM :
if (doctype == MMD_TYPE_ORDERED_LIST)
{
snprintf(leader, sizeof(leader), "%d. ", i);
format_block(dd, current, deffont, SIZE_BODY, left, right, leader);
}
else
{
format_block(dd, current, deffont, SIZE_BODY, left, right, /*leader*/"• ");
}
break;
.fi
.PP
Paragraphs have a leading blank line and are likewise directly formatted:
.nf
case MMD_TYPE_PARAGRAPH :
// Add a blank line before the paragraph...
dd\->y \-= SIZE_BODY * LINE_HEIGHT;
// Format the paragraph...
format_block(dd, current, deffont, SIZE_BODY, left, right, /*leader*/NULL);
break;
.fi
.PP
Tables have a leading blank line and are formatted using the format_table function:
.nf
case MMD_TYPE_TABLE :
// Add a blank line before the table...
dd\->y \-= SIZE_BODY * LINE_HEIGHT;
// Format the table...
format_table(dd, current, left, right);
break;
.fi
.PP
Code blocks have a leading blank line, are indented slightly (to account for the padded background), and are formatted using the format_code function:
.nf
case MMD_TYPE_CODE_BLOCK :
// Add a blank line before the code block...
dd\->y \-= SIZE_BODY * LINE_HEIGHT;
// Format the code block...
format_code(dd, current, left + CODE_PADDING, right \- CODE_PADDING);
break;
.fi
.PP
Headings get some extra processing. First, the current heading is remembered in the docdata_t structure so it can be used in the page footer:
.nf
case MMD_TYPE_HEADING_1 :
case MMD_TYPE_HEADING_2 :
case MMD_TYPE_HEADING_3 :
case MMD_TYPE_HEADING_4 :
case MMD_TYPE_HEADING_5 :
case MMD_TYPE_HEADING_6 :
// Update the current heading
free(dd\->heading);
dd\->heading = mmdCopyAllText(current);
.fi
.PP
Then we add a blank line and format the heading with the boldface font at a larger size using the format_block function:
.nf
// Add a blank line before the heading...
dd\->y \-= heading_sizes[curtype \- MMD_TYPE_HEADING_1] * LINE_HEIGHT;
// Format the heading...
format_block(dd, current, DOCFONT_BOLD,
heading_sizes[curtype \- MMD_TYPE_HEADING_1], left, right,
/*leader*/NULL);
.fi
.PP
Once the heading is formatted, we record it in the toc array as a PDF outline item object/dictionary:
.nf
// Add the heading to the table\-of\-contents...
if (dd\->num_toc < DOCTOC_MAX)
{
doctoc_t *t = dd\->toc + dd\->num_toc;
// New TOC
pdfio_array_t *dest; // Destination array
t\->level = curtype \- MMD_TYPE_HEADING_1;
t\->dict = pdfioDictCreate(dd\->pdf);
t\->obj = pdfioFileCreateObj(dd\->pdf, t\->dict);
dest = pdfioArrayCreate(dd\->pdf);
pdfioArrayAppendObj(dest,
pdfioFileGetPage(dd\->pdf, pdfioFileGetNumPages(dd\->pdf) \- 1));
pdfioArrayAppendName(dest, "XYZ");
pdfioArrayAppendNumber(dest, PAGE_LEFT);
pdfioArrayAppendNumber(dest,
dd\->y + heading_sizes[curtype \- MMD_TYPE_HEADING_1] * LINE_HEIGHT);
pdfioArrayAppendNumber(dest, 0.0);
pdfioDictSetArray(t\->dict, "Dest", dest);
pdfioDictSetString(t\->dict, "Title", pdfioStringCreate(dd\->pdf, dd\->heading));
dd\->num_toc ++;
}
.fi
.PP
Finally, we also save the heading's target name and its location in the targets array to allow interior links to work:
.nf
// Add the heading to the list of link targets...
if (dd\->num_targets < DOCTARGET_MAX)
{
doctarget_t *t = dd\->targets + dd\->num_targets;
// New target
make_target_name(t\->name, dd\->heading, sizeof(t\->name));
t\->page = pdfioFileGetNumPages(dd\->pdf) \- 1;
t\->y = dd\->y + heading_sizes[curtype \- MMD_TYPE_HEADING_1] * LINE_HEIGHT;
dd\->num_targets ++;
}
break;
.fi
.PP
Formatting Paragraphs, Headings, List Items, and Table Cells
.PP
Paragraphs, headings, list items, and table cells all use the same basic formatting algorithm. Text, checkboxes, and images are collected until the nodes in the current block are used up or the content reaches the right margin.
.PP
In order to keep adjacent blocks of text together, the formatting algorithm makes sure that at least 3 lines of text can fit before the bottom edge of the page:
.nf
if (mmdGetNextSibling(block))
need_bottom = 3.0 * SIZE_BODY * LINE_HEIGHT;
else
need_bottom = 0.0;
.fi
.PP
Leader text (used for list items) is right justified to the left margin and becomes the first fragment on the line when present.
.nf
if (leader)
{
// Add leader text on first line...
frags[0].type = MMD_TYPE_NORMAL_TEXT;
frags[0].width = pdfioContentTextMeasure(dd\->fonts[deffont], leader, fsize);
frags[0].height = fsize;
frags[0].x = left \- frags[0].width;
frags[0].imagenum = 0;
frags[0].text = leader;
frags[0].url = NULL;
frags[0].ws = false;
frags[0].font = deffont;
frags[0].color = DOCCOLOR_BLACK;
num_frags = 1;
lineheight = fsize * LINE_HEIGHT;
}
else
{
// No leader text...
num_frags = 0;
lineheight = 0.0;
}
frag = frags + num_frags;
.fi
.PP
If the current content fragment won't fit, we call render_line to draw what we have, adjusting the left margin as needed for table cells:
.nf
// See if this node will fit on the current line...
if ((num_frags > 0 && (x + width + wswidth) >= right) || num_frags == LINEFRAG_MAX)
{
// No, render this line and start over...
if (blocktype == MMD_TYPE_TABLE_HEADER_CELL ||
blocktype == MMD_TYPE_TABLE_BODY_CELL_CENTER)
margin_left = 0.5 * (right \- x);
else if (blocktype == MMD_TYPE_TABLE_BODY_CELL_RIGHT)
margin_left = right \- x;
else
margin_left = 0.0;
render_line(dd, margin_left, need_bottom, lineheight, num_frags, frags);
num_frags = 0;
frag = frags;
x = left;
lineheight = 0.0;
need_bottom = 0.0;
.fi
.PP
Block quotes (blocks that use italic as the default font) have an orange bar to the left of the block:
.nf
if (deffont == DOCFONT_ITALIC)
{
// Add an orange bar to the left of block quotes...
set_color(dd, DOCCOLOR_ORANGE);
pdfioContentSave(dd\->st);
pdfioContentSetLineWidth(dd\->st, 3.0);
pdfioContentPathMoveTo(dd\->st, left \- 6.0, dd\->y \- (LINE_HEIGHT \- 1.0) * fsize);
pdfioContentPathLineTo(dd\->st, left \- 6.0, dd\->y + fsize);
pdfioContentStroke(dd\->st);
pdfioContentRestore(dd\->st);
}
.fi
.PP
Finally, we add the current content fragment to the array:
.nf
// Add the current node to the fragment list
if (num_frags == 0)
{
// No leading whitespace at the start of the line
ws = false;
wswidth = 0.0;
}
frag\->type = type;
frag\->x = x;
frag\->width = width + wswidth;
frag\->height = text ? fsize : height;
frag\->imagenum = imagenum;
frag\->text = text;
frag\->url = url;
frag\->ws = ws;
frag\->font = font;
frag\->color = color;
num_frags ++;
frag ++;
x += width + wswidth;
if (height > lineheight)
lineheight = height;
.fi
.PP
Formatting Code Blocks
.PP
Code blocks consist of one or more lines of plain monospaced text. We draw a light gray background behind each line with a small bit of padding at the top and bottom:
.nf
// Draw the top padding...
set_color(dd, DOCCOLOR_LTGRAY);
pdfioContentPathRect(dd\->st, left \- CODE_PADDING, dd\->y + SIZE_CODEBLOCK,
right \- left + 2.0 * CODE_PADDING, CODE_PADDING);
pdfioContentFillAndStroke(dd\->st, false);
// Start a code text block...
set_font(dd, DOCFONT_MONOSPACE, SIZE_CODEBLOCK);
pdfioContentTextBegin(dd\->st);
pdfioContentTextMoveTo(dd\->st, left, dd\->y);
for (code = mmdGetFirstChild(block); code; code = mmdGetNextSibling(code))
{
set_color(dd, DOCCOLOR_LTGRAY);
pdfioContentPathRect(dd\->st, left \- CODE_PADDING,
dd\->y \- (LINE_HEIGHT \- 1.0) * SIZE_CODEBLOCK,
right \- left + 2.0 * CODE_PADDING, lineheight);
pdfioContentFillAndStroke(dd\->st, false);
set_color(dd, DOCCOLOR_RED);
pdfioContentTextShow(dd\->st, UNICODE_VALUE, mmdGetText(code));
dd\->y \-= lineheight;
if (dd\->y < dd\->art_box.y1)
{
// End the current text block...
pdfioContentTextEnd(dd\->st);
// Start a new page...
new_page(dd);
set_font(dd, DOCFONT_MONOSPACE, SIZE_CODEBLOCK);
dd\->y \-= lineheight;
pdfioContentTextBegin(dd\->st);
pdfioContentTextMoveTo(dd\->st, left, dd\->y);
}
}
// End the current text block...
pdfioContentTextEnd(dd\->st);
dd\->y += lineheight;
// Draw the bottom padding...
set_color(dd, DOCCOLOR_LTGRAY);
pdfioContentPathRect(dd\->st, left \- CODE_PADDING,
dd\->y \- CODE_PADDING \- (LINE_HEIGHT \- 1.0) * SIZE_CODEBLOCK,
right \- left + 2.0 * CODE_PADDING, CODE_PADDING);
pdfioContentFillAndStroke(dd\->st, false);
.fi
.PP
Formatting Tables
.PP
Tables are the most difficult to format. We start by scanning the entire table and measuring every cell with the measure_cell function:
.nf
for (num_cols = 0, num_rows = 0, rowptr = rows, current = mmdGetFirstChild(table);
current && num_rows < TABLEROW_MAX;
current = next)
{
next = mmd_walk_next(table, current);
type = mmdGetType(current);
if (type == MMD_TYPE_TABLE_ROW)
{
// Parse row...
for (col = 0, current = mmdGetFirstChild(current);
current && num_cols < TABLECOL_MAX;
current = mmdGetNextSibling(current), col ++)
{
rowptr\->cells[col] = current;
measure_cell(dd, current, cols + col);
if (col >= num_cols)
num_cols = col + 1;
}
rowptr ++;
num_rows ++;
}
}
.fi
.PP
The measure_cell function also updates the minimum and maximum width needed for each column. To this we add the cell padding to compute the total table width:
.nf
// Figure out the width of each column...
for (col = 0, table_width = 0.0; col < num_cols; col ++)
{
cols[col].max_width += 2.0 * TABLE_PADDING;
table_width += cols[col].max_width;
cols[col].width = cols[col].max_width;
}
.fi
.PP
If the calculated width is more than the available width, we need to adjust the width of the columns. The algorithm used here breaks the available width into N equal\-width columns \- any columns wider than this will be scaled proportionately. This works out as two steps \- one to calculate the base width of "narrow" columns and a second to distribute the remaining width amongst the wider columns:
.nf
format_width = right \- left \- 2.0 * TABLE_PADDING * num_cols;
if (table_width > format_width)
{
// Content too wide, try scaling the widths...
double avg_width, // Average column width
base_width, // Base width
remaining_width, // Remaining width
scale_width; // Width for scaling
size_t num_remaining_cols = 0; // Number of remaining columns
// First mark any columns that are narrower than the average width...
avg_width = format_width / num_cols;
for (col = 0, base_width = 0.0, remaining_width = 0.0; col < num_cols; col ++)
{
if (cols[col].width > avg_width)
{
remaining_width += cols[col].width;
num_remaining_cols ++;
}
else
{
base_width += cols[col].width;
}
}
// Then proportionately distribute the remaining width to the other columns...
format_width \-= base_width;
for (col = 0, table_width = 0.0; col < num_cols; col ++)
{
if (cols[col].width > avg_width)
cols[col].width = cols[col].width * format_width / remaining_width;
table_width += cols[col].width;
}
}
.fi
.PP
Now that we have the widths of the columns, we can calculate the left and right margins of each column for formatting the cell text:
.nf
// Calculate the margins of each column in preparation for formatting
for (col = 0, x = left + TABLE_PADDING; col < num_cols; col ++)
{
cols[col].left = x;
cols[col].right = x + cols[col].width;
x += cols[col].width + 2.0 * TABLE_PADDING;
}
.fi
.PP
Then we re\-measure the cells using the final column widths to determine the height of each cell and row:
.nf
// Calculate the height of each row and cell in preparation for formatting
for (row = 0, rowptr = rows; row < num_rows; row ++, rowptr ++)
{
for (col = 0; col < num_cols; col ++)
{
height = measure_cell(dd, rowptr\->cells[col], cols + col) + 2.0 * TABLE_PADDING;
if (height > rowptr\->height)
rowptr\->height = height;
}
}
.fi
.PP
Finally, we render each row in the table:
.nf
// Render each table row...
for (row = 0, rowptr = rows; row < num_rows; row ++, rowptr ++)
render_row(dd, num_cols, cols, rowptr);
.fi
.PP
Rendering the Markdown Document
.PP
The formatted content in arrays of linefrag_t and tablerow_t structures is passed to the render_line and render_row functions respectively to produce content in the PDF document.
.PP
Rendering a Line in a Paragraph, Heading, or Table Cell
.PP
The render_line function adds content from the linefrag_t array to a PDF page. It starts by determining whether a new page is needed:
.nf
if (!dd\->st)
{
new_page(dd);
margin_top = 0.0;
}
dd\->y \-= margin_top + lineheight;
if ((dd\->y \- need_bottom) < dd\->art_box.y1)
{
new_page(dd);
dd\->y \-= lineheight;
}
.fi
.PP
We then loop through the fragments for the current line, drawing checkboxes, images, and text as needed. When a hyperlink is present, we add the link to the links array in the docdata_t structure, mapping "@" and "@@" to an internal link corresponding to the linked text:
.nf
if (frag\->url && dd\->num_links < DOCLINK_MAX)
{
doclink_t *l = dd\->links + dd\->num_links;
// Pointer to this link record
if (!strcmp(frag\->url, "@"))
{
// Use mapped text as link target...
char targetlink[129]; // Targeted link
targetlink[0] = '#';
make_target_name(targetlink + 1, frag\->text, sizeof(targetlink) \- 1);
l\->url = pdfioStringCreate(dd\->pdf, targetlink);
}
else if (!strcmp(frag\->url, "@@"))
{
// Use literal text as anchor...
l\->url = pdfioStringCreatef(dd\->pdf, "#%s", frag\->text);
}
else
{
// Use URL as\-is...
l\->url = frag\->url;
}
l\->box.x1 = frag\->x;
l\->box.y1 = dd\->y;
l\->box.x2 = frag\->x + frag\->width;
l\->box.y2 = dd\->y + frag\->height;
dd\->num_links ++;
}
.fi
.PP
These are later written as annotations in the add_links function.
.PP
Rendering a Table Row
.PP
The render_row function takes a row of cells and the corresponding column definitions. It starts by drawing the border boxes around body cells:
.nf
if (mmdGetType(row\->cells[0]) == MMD_TYPE_TABLE_HEADER_CELL)
{
// Header row, no border...
deffont = DOCFONT_BOLD;
}
else
{
// Regular body row, add borders...
deffont = DOCFONT_REGULAR;
set_color(dd, DOCCOLOR_GRAY);
pdfioContentPathRect(dd\->st, cols[0].left \- TABLE_PADDING, dd\->y \- row\->height,
cols[num_cols \- 1].right \- cols[0].left +
2.0 * TABLE_PADDING, row\->height);
for (col = 1; col < num_cols; col ++)
{
pdfioContentPathMoveTo(dd\->st, cols[col].left \- TABLE_PADDING, dd\->y);
pdfioContentPathLineTo(dd\->st, cols[col].left \- TABLE_PADDING, dd\->y \- row\->height);
}
pdfioContentStroke(dd\->st);
}
.fi
.PP
Then it formats each cell using the format_block function described previously. The page y value is reset before formatting each cell:
.nf
row_y = dd\->y;
for (col = 0; col < num_cols; col ++)
{
dd\->y = row_y;
format_block(dd, row\->cells[col], deffont, SIZE_TABLE, cols[col].left,
cols[col].right, /*leader*/NULL);
}
dd\->y = row_y \- row\->height;
.fi
.SH ENUMERATIONS .SH ENUMERATIONS
.SS pdfio_cs_e .SS pdfio_cs_e

View File

@ -505,7 +505,7 @@ span.string {
</div> </div>
<div class="body"> <div class="body">
<h2 class="title" id="introduction">Introduction</h2> <h2 class="title" id="introduction">Introduction</h2>
<p>PDFio is a simple C library for reading and writing PDF files. The primary goals of pdfio are:</p> <p>PDFio is a simple C library for reading and writing PDF files. The primary goals of PDFio are:</p>
<ul> <ul>
<li><p>Read and write any version of PDF file</p> <li><p>Read and write any version of PDF file</p>
</li> </li>
@ -709,8 +709,8 @@ startxref % startxref keyword
<h3 class="title" id="reading-pdf-files">Reading PDF Files</h3> <h3 class="title" id="reading-pdf-files">Reading PDF Files</h3>
<p>You open an existing PDF file using the <a href="#pdfioFileOpen"><code>pdfioFileOpen</code></a> function:</p> <p>You open an existing PDF file using the <a href="#pdfioFileOpen"><code>pdfioFileOpen</code></a> function:</p>
<pre><code class="language-c">pdfio_file_t *pdf = <pre><code class="language-c">pdfio_file_t *pdf =
pdfioFileOpen(<span class="string">&quot;myinputfile.pdf&quot;</span>, password_cb, password_data, pdfioFileOpen(<span class="string">&quot;myinputfile.pdf&quot;</span>, password_cb, password_data, error_cb,
error_cb, error_data); error_data);
</code></pre> </code></pre>
<p>where the five arguments to the function are the filename (&quot;myinputfile.pdf&quot;), an optional password callback function (<code>password_cb</code>) and data pointer value (<code>password_data</code>), and an optional error callback function (<code>error_cb</code>) and data pointer value (<code>error_data</code>). The password callback is called for encrypted PDF files that are not using the default password, for example:</p> <p>where the five arguments to the function are the filename (&quot;myinputfile.pdf&quot;), an optional password callback function (<code>password_cb</code>) and data pointer value (<code>password_data</code>), and an optional error callback function (<code>error_cb</code>) and data pointer value (<code>error_data</code>). The password callback is called for encrypted PDF files that are not using the default password, for example:</p>
<pre><code class="language-c"><span class="reserved">const</span> <span class="reserved">char</span> * <pre><code class="language-c"><span class="reserved">const</span> <span class="reserved">char</span> *
@ -817,8 +817,7 @@ pdfio_array_t *crop_box; <span class="comment">// CropBox array</span>
<pre><code class="language-c">pdfio_rect_t media_box = { <span class="number">0.0</span>, <span class="number">0.0</span>, <span class="number">612.0</span>, <span class="number">792.0</span> }; <span class="comment">// US Letter</span> <pre><code class="language-c">pdfio_rect_t media_box = { <span class="number">0.0</span>, <span class="number">0.0</span>, <span class="number">612.0</span>, <span class="number">792.0</span> }; <span class="comment">// US Letter</span>
pdfio_rect_t crop_box = { <span class="number">36.0</span>, <span class="number">36.0</span>, <span class="number">576.0</span>, <span class="number">756.0</span> }; <span class="comment">// w/0.5&quot; margins</span> pdfio_rect_t crop_box = { <span class="number">36.0</span>, <span class="number">36.0</span>, <span class="number">576.0</span>, <span class="number">756.0</span> }; <span class="comment">// w/0.5&quot; margins</span>
pdfio_file_t *pdf = pdfioFileCreate(<span class="string">&quot;myoutputfile.pdf&quot;</span>, <span class="string">&quot;2.0&quot;</span>, pdfio_file_t *pdf = pdfioFileCreate(<span class="string">&quot;myoutputfile.pdf&quot;</span>, <span class="string">&quot;2.0&quot;</span>, &amp;media_box, &amp;crop_box,
&amp;media_box, &amp;crop_box,
error_cb, error_data); error_cb, error_data);
</code></pre> </code></pre>
<p>where the six arguments to the function are the filename (&quot;myoutputfile.pdf&quot;), PDF version (&quot;2.0&quot;), media box (<code>media_box</code>), crop box (<code>crop_box</code>), an optional error callback function (<code>error_cb</code>), and an optional pointer value for the error callback function (<code>error_data</code>). The units for the media and crop boxes are points (1/72nd of an inch).</p> <p>where the six arguments to the function are the filename (&quot;myoutputfile.pdf&quot;), PDF version (&quot;2.0&quot;), media box (<code>media_box</code>), crop box (<code>crop_box</code>), an optional error callback function (<code>error_cb</code>), and an optional pointer value for the error callback function (<code>error_data</code>). The units for the media and crop boxes are points (1/72nd of an inch).</p>
@ -826,9 +825,8 @@ pdfio_file_t *pdf = pdfioFileCreate(<span class="string">&quot;myoutputfile.pdf&
<pre><code class="language-c">pdfio_rect_t media_box = { <span class="number">0.0</span>, <span class="number">0.0</span>, <span class="number">612.0</span>, <span class="number">792.0</span> }; <span class="comment">// US Letter</span> <pre><code class="language-c">pdfio_rect_t media_box = { <span class="number">0.0</span>, <span class="number">0.0</span>, <span class="number">612.0</span>, <span class="number">792.0</span> }; <span class="comment">// US Letter</span>
pdfio_rect_t crop_box = { <span class="number">36.0</span>, <span class="number">36.0</span>, <span class="number">576.0</span>, <span class="number">756.0</span> }; <span class="comment">// w/0.5&quot; margins</span> pdfio_rect_t crop_box = { <span class="number">36.0</span>, <span class="number">36.0</span>, <span class="number">576.0</span>, <span class="number">756.0</span> }; <span class="comment">// w/0.5&quot; margins</span>
pdfio_file_t *pdf = pdfioFileCreateOutput(output_cb, output_ctx, <span class="string">&quot;2.0&quot;</span>, pdfio_file_t *pdf = pdfioFileCreateOutput(output_cb, output_ctx, <span class="string">&quot;2.0&quot;</span>, &amp;media_box,
&amp;media_box, &amp;crop_box, &amp;crop_box, error_cb, error_data);
error_cb, error_data);
</code></pre> </code></pre>
<p>Once the file is created, use the <a href="#pdfioFileCreateObj"><code>pdfioFileCreateObj</code></a>, <a href="#pdfioFileCreatePage"><code>pdfioFileCreatePage</code></a>, and <a href="#pdfioPageCopy"><code>pdfioPageCopy</code></a> functions to create objects and pages in the file.</p> <p>Once the file is created, use the <a href="#pdfioFileCreateObj"><code>pdfioFileCreateObj</code></a>, <a href="#pdfioFileCreatePage"><code>pdfioFileCreatePage</code></a>, and <a href="#pdfioPageCopy"><code>pdfioPageCopy</code></a> functions to create objects and pages in the file.</p>
<p>Finally, the <a href="#pdfioFileClose"><code>pdfioFileClose</code></a> function writes the PDF cross-reference and &quot;trailer&quot; information, closes the file, and frees all memory that was used for it.</p> <p>Finally, the <a href="#pdfioFileClose"><code>pdfioFileClose</code></a> function writes the PDF cross-reference and &quot;trailer&quot; information, closes the file, and frees all memory that was used for it.</p>
@ -998,10 +996,9 @@ pdfio_obj_t *arial =
<pre><code class="language-c">pdfio_file_t *pdf = pdfioFileCreate(...); <pre><code class="language-c">pdfio_file_t *pdf = pdfioFileCreate(...);
<span class="reserved">unsigned</span> <span class="reserved">char</span> data[<span class="number">1024</span> * <span class="number">1024</span> * <span class="number">4</span>]; <span class="comment">// 1024x1024 RGBA image data</span> <span class="reserved">unsigned</span> <span class="reserved">char</span> data[<span class="number">1024</span> * <span class="number">1024</span> * <span class="number">4</span>]; <span class="comment">// 1024x1024 RGBA image data</span>
pdfio_obj_t *img = pdfio_obj_t *img =
pdfioFileCreateImageObjFromData(pdf, data, <span class="comment">/*width*/</span><span class="number">1024</span>, pdfioFileCreateImageObjFromData(pdf, data, <span class="comment">/*width*/</span><span class="number">1024</span>, <span class="comment">/*height*/</span><span class="number">1024</span>,
<span class="comment">/*height*/</span><span class="number">1024</span>, <span class="comment">/*num_colors*/</span><span class="number">3</span>, <span class="comment">/*num_colors*/</span><span class="number">3</span>, <span class="comment">/*color_data*/</span>NULL,
<span class="comment">/*color_data*/</span>NULL, <span class="comment">/*alpha*/</span><span class="reserved">true</span>, <span class="comment">/*alpha*/</span><span class="reserved">true</span>, <span class="comment">/*interpolate*/</span><span class="reserved">false</span>);
<span class="comment">/*interpolate*/</span><span class="reserved">false</span>);
</code></pre> </code></pre>
<p>will create an object for a 1024x1024 RGBA image in memory, using the default color space for 3 colors (&quot;DeviceRGB&quot;). We can use one of the <a href="#color-space-functions">color space functions</a> to use a specific color space for this image, for example:</p> <p>will create an object for a 1024x1024 RGBA image in memory, using the default color space for 3 colors (&quot;DeviceRGB&quot;). We can use one of the <a href="#color-space-functions">color space functions</a> to use a specific color space for this image, for example:</p>
<pre><code class="language-c">pdfio_file_t *pdf = pdfioFileCreate(...); <pre><code class="language-c">pdfio_file_t *pdf = pdfioFileCreate(...);
@ -1009,24 +1006,20 @@ pdfio_obj_t *img =
<span class="comment">// Create an AdobeRGB color array</span> <span class="comment">// Create an AdobeRGB color array</span>
pdfio_array_t *adobe_rgb = pdfio_array_t *adobe_rgb =
pdfioArrayCreateColorFromMatrix(pdf, <span class="number">3</span>, pdfioAdobeRGBGamma, pdfioArrayCreateColorFromMatrix(pdf, <span class="number">3</span>, pdfioAdobeRGBGamma,
pdfioAdobeRGBMatrix, pdfioAdobeRGBMatrix, pdfioAdobeRGBWhitePoint);
pdfioAdobeRGBWhitePoint);
<span class="comment">// Create a 1024x1024 RGBA image using AdobeRGB</span> <span class="comment">// Create a 1024x1024 RGBA image using AdobeRGB</span>
<span class="reserved">unsigned</span> <span class="reserved">char</span> data[<span class="number">1024</span> * <span class="number">1024</span> * <span class="number">4</span>]; <span class="comment">// 1024x1024 RGBA image data</span> <span class="reserved">unsigned</span> <span class="reserved">char</span> data[<span class="number">1024</span> * <span class="number">1024</span> * <span class="number">4</span>]; <span class="comment">// 1024x1024 RGBA image data</span>
pdfio_obj_t *img = pdfio_obj_t *img =
pdfioFileCreateImageObjFromData(pdf, data, <span class="comment">/*width*/</span><span class="number">1024</span>, pdfioFileCreateImageObjFromData(pdf, data, <span class="comment">/*width*/</span><span class="number">1024</span>, <span class="comment">/*height*/</span><span class="number">1024</span>,
<span class="comment">/*height*/</span><span class="number">1024</span>, <span class="comment">/*num_colors*/</span><span class="number">3</span>, <span class="comment">/*num_colors*/</span><span class="number">3</span>, <span class="comment">/*color_data*/</span>adobe_rgb,
<span class="comment">/*color_data*/</span>adobe_rgb, <span class="comment">/*alpha*/</span><span class="reserved">true</span>, <span class="comment">/*interpolate*/</span><span class="reserved">false</span>);
<span class="comment">/*alpha*/</span><span class="reserved">true</span>,
<span class="comment">/*interpolate*/</span><span class="reserved">false</span>);
</code></pre> </code></pre>
<p>The &quot;interpolate&quot; argument specifies whether the colors in the image should be smoothed/interpolated when scaling. This is most useful for photographs but should be <code>false</code> for screenshot and barcode images.</p> <p>The &quot;interpolate&quot; argument specifies whether the colors in the image should be smoothed/interpolated when scaling. This is most useful for photographs but should be <code>false</code> for screenshot and barcode images.</p>
<p>If you have a JPEG or PNG file, use the <a href="#pdfioFileCreateImageObjFromFile"><code>pdfioFileCreateImageObjFromFile</code></a> function to copy the image into a PDF image object, for example:</p> <p>If you have a JPEG or PNG file, use the <a href="#pdfioFileCreateImageObjFromFile"><code>pdfioFileCreateImageObjFromFile</code></a> function to copy the image into a PDF image object, for example:</p>
<pre><code class="language-c">pdfio_file_t *pdf = pdfioFileCreate(...); <pre><code class="language-c">pdfio_file_t *pdf = pdfioFileCreate(...);
pdfio_obj_t *img = pdfio_obj_t *img =
pdfioFileCreateImageObjFromFile(pdf, <span class="string">&quot;myphoto.jpg&quot;</span>, pdfioFileCreateImageObjFromFile(pdf, <span class="string">&quot;myphoto.jpg&quot;</span>, <span class="comment">/*interpolate*/</span><span class="reserved">true</span>);
<span class="comment">/*interpolate*/</span><span class="reserved">true</span>);
</code></pre> </code></pre>
<blockquote> <blockquote>
<p>Note: Currently <code>pdfioFileCreateImageObjFromFile</code> does not support 12 bit JPEG files or PNG files with an alpha channel.</p> <p>Note: Currently <code>pdfioFileCreateImageObjFromFile</code> does not support 12 bit JPEG files or PNG files with an alpha channel.</p>
@ -1181,9 +1174,8 @@ main(<span class="reserved">int</span> argc, <span clas
filename = argv[<span class="number">1</span>]; filename = argv[<span class="number">1</span>];
<span class="comment">// Open the PDF file with the default callbacks...</span> <span class="comment">// Open the PDF file with the default callbacks...</span>
pdf = pdfioFileOpen(filename, <span class="comment">/*password_cb*/</span>NULL, pdf = pdfioFileOpen(filename, <span class="comment">/*password_cb*/</span>NULL, <span class="comment">/*password_cbdata*/</span>NULL,
<span class="comment">/*password_cbdata*/</span>NULL, <span class="comment">/*error_cb*/</span>NULL, <span class="comment">/*error_cb*/</span>NULL, <span class="comment">/*error_cbdata*/</span>NULL);
<span class="comment">/*error_cbdata*/</span>NULL);
<span class="reserved">if</span> (pdf == NULL) <span class="reserved">if</span> (pdf == NULL)
<span class="reserved">return</span> (<span class="number">1</span>); <span class="reserved">return</span> (<span class="number">1</span>);
@ -1229,9 +1221,8 @@ create_pdf_image_file(
<span class="comment">// Create the PDF file...</span> <span class="comment">// Create the PDF file...</span>
pdf = pdfioFileCreate(pdfname, <span class="comment">/*version*/</span>NULL, <span class="comment">/*media_box*/</span>NULL, pdf = pdfioFileCreate(pdfname, <span class="comment">/*version*/</span>NULL, <span class="comment">/*media_box*/</span>NULL, <span class="comment">/*crop_box*/</span>NULL,
<span class="comment">/*crop_box*/</span>NULL, <span class="comment">/*error_cb*/</span>NULL, <span class="comment">/*error_cb*/</span>NULL, <span class="comment">/*error_cbdata*/</span>NULL);
<span class="comment">/*error_cbdata*/</span>NULL);
<span class="reserved">if</span> (!pdf) <span class="reserved">if</span> (!pdf)
<span class="reserved">return</span> (<span class="reserved">false</span>); <span class="reserved">return</span> (<span class="reserved">false</span>);
@ -1265,9 +1256,9 @@ create_pdf_image_file(
width = pdfioImageGetWidth(image); width = pdfioImageGetWidth(image);
height = pdfioImageGetHeight(image); height = pdfioImageGetHeight(image);
<span class="comment">// Default media_box is &quot;universal&quot; 595.28x792 points (8.27x11in or</span> <span class="comment">// Default media_box is &quot;universal&quot; 595.28x792 points (8.27x11in or 210x279mm).</span>
<span class="comment">// 210x279mm). Use margins of 36 points (0.5in or 12.7mm) with another</span> <span class="comment">// Use margins of 36 points (0.5in or 12.7mm) with another 36 points for the</span>
<span class="comment">// 36 points for the caption underneath...</span> <span class="comment">// caption underneath...</span>
swidth = <span class="number">595.28</span> - <span class="number">72.0</span>; swidth = <span class="number">595.28</span> - <span class="number">72.0</span>;
sheight = swidth * height / width; sheight = swidth * height / width;
<span class="reserved">if</span> (sheight &gt; (<span class="number">792.0</span> - <span class="number">36.0</span> - <span class="number">72.0</span>)) <span class="reserved">if</span> (sheight &gt; (<span class="number">792.0</span> - <span class="number">36.0</span> - <span class="number">72.0</span>))
@ -1284,8 +1275,8 @@ create_pdf_image_file(
<span class="comment">// Draw the caption in black...</span> <span class="comment">// Draw the caption in black...</span>
pdfioContentSetFillColorDeviceGray(page, <span class="number">0.0</span>); pdfioContentSetFillColorDeviceGray(page, <span class="number">0.0</span>);
<span class="comment">// Compute the starting point for the text - Courier is monospaced</span> <span class="comment">// Compute the starting point for the text - Courier is monospaced with a</span>
<span class="comment">// with a nominal width of 0.6 times the text height...</span> <span class="comment">// nominal width of 0.6 times the text height...</span>
tx = <span class="number">0.5</span> * (<span class="number">595.28</span> - <span class="number">18.0</span> * <span class="number">0.6</span> * strlen(caption)); tx = <span class="number">0.5</span> * (<span class="number">595.28</span> - <span class="number">18.0</span> * <span class="number">0.6</span> * strlen(caption));
<span class="comment">// Position and draw the caption underneath...</span> <span class="comment">// Position and draw the caption underneath...</span>
@ -1353,8 +1344,7 @@ make_code128(<span class="reserved">char</span> *dst, <span clas
} }
</code></pre> </code></pre>
<p>The <code>main</code> function does the rest of the work. The barcode font is imported using the <a href="#pdfioFileCreateFontObjFromFile"><code>pdfioFileCreateFontObjFromFile</code></a> function. We pass <code>false</code> for the &quot;unicode&quot; argument since we just want the (default) ASCII encoding:</p> <p>The <code>main</code> function does the rest of the work. The barcode font is imported using the <a href="#pdfioFileCreateFontObjFromFile"><code>pdfioFileCreateFontObjFromFile</code></a> function. We pass <code>false</code> for the &quot;unicode&quot; argument since we just want the (default) ASCII encoding:</p>
<pre><code class="language-c">barcode_font = pdfioFileCreateFontObjFromFile(pdf, <span class="string">&quot;code128.ttf&quot;</span>, <pre><code class="language-c">barcode_font = pdfioFileCreateFontObjFromFile(pdf, <span class="string">&quot;code128.ttf&quot;</span>, <span class="comment">/*unicode*/</span><span class="reserved">false</span>);
<span class="comment">/*unicode*/</span><span class="reserved">false</span>);
</code></pre> </code></pre>
<p>Since barcodes usually have the number or text represented by the barcode printed underneath it, we also need a regular text font, for which we can choose one of the standard 14 PostScript base fonts using the <a href="#pdfioFileCreateFontObjFromBase"><code>pdfioFileCreateFontObjFromBase</code></a> function:</p> <p>Since barcodes usually have the number or text represented by the barcode printed underneath it, we also need a regular text font, for which we can choose one of the standard 14 PostScript base fonts using the <a href="#pdfioFileCreateFontObjFromBase"><code>pdfioFileCreateFontObjFromBase</code></a> function:</p>
<pre><code class="language-c">text_font = pdfioFileCreateFontObjFromBase(pdf, <span class="string">&quot;Helvetica&quot;</span>); <pre><code class="language-c">text_font = pdfioFileCreateFontObjFromBase(pdf, <span class="string">&quot;Helvetica&quot;</span>);
@ -1378,8 +1368,7 @@ make_code128(<span class="reserved">char</span> *dst, <span clas
<span class="reserved">if</span> (text &amp;&amp; text_font) <span class="reserved">if</span> (text &amp;&amp; text_font)
{ {
text_height = <span class="number">9.0</span>; text_height = <span class="number">9.0</span>;
text_width = pdfioContentTextMeasure(text_font, text, text_width = pdfioContentTextMeasure(text_font, text, text_height);
text_height);
} }
<span class="comment">// Compute the size of the PDF page...</span> <span class="comment">// Compute the size of the PDF page...</span>
@ -1387,8 +1376,7 @@ pdfio_rect_t media_box;
media_box.x1 = <span class="number">0.0</span>; media_box.x1 = <span class="number">0.0</span>;
media_box.y1 = <span class="number">0.0</span>; media_box.y1 = <span class="number">0.0</span>;
media_box.x2 = (barcode_width &gt; text_width ? media_box.x2 = (barcode_width &gt; text_width ? barcode_width : text_width) + <span class="number">18.0</span>;
barcode_width : text_width) + <span class="number">18.0</span>;
media_box.y2 = barcode_height + text_height + <span class="number">18.0</span>; media_box.y2 = barcode_height + text_height + <span class="number">18.0</span>;
</code></pre> </code></pre>
<p>Finally, we just need to create a page of the specified size that references the two fonts:</p> <p>Finally, we just need to create a page of the specified size that references the two fonts:</p>
@ -1429,8 +1417,650 @@ pdfioStreamClose(page_st);
<h3 class="title" id="convert-markdown-to-pdf">Convert Markdown to PDF</h3> <h3 class="title" id="convert-markdown-to-pdf">Convert Markdown to PDF</h3>
<p>Markdown is a simple plain text format that supports things like headings, links, character styles, tables, and embedded images. The <code>md2pdf.c</code> example code uses the <a href="https://www.msweet.org/mmd/">mmd</a> library to convert markdown to a PDF file that can be distributed.</p> <p>Markdown is a simple plain text format that supports things like headings, links, character styles, tables, and embedded images. The <code>md2pdf.c</code> example code uses the <a href="https://www.msweet.org/mmd/">mmd</a> library to convert markdown to a PDF file that can be distributed.</p>
<blockquote> <blockquote>
<p>Note: The md2pdf example is by far the most complex example code included with PDFio and shows how to lay out text, add headers and footers, add links, embed images, and format tables.</p> <p>Note: The md2pdf example is by far the most complex example code included with PDFio and shows how to lay out text, add headers and footers, add links, embed images, format tables, and add an outline (table of contents) for navigation.</p>
</blockquote> </blockquote>
<h4 id="managing-document-state">Managing Document State</h4>
<p>The <code>md2pdf</code> program needs to maintain three sets of state - one for the markdown document which is represented by nodes of type <code>mmd_t</code> and the others for the PDF document and current PDF page which are contained in the <code>docdata_t</code> structure:</p>
<pre><code class="language-c"><span class="reserved">typedef</span> <span class="reserved">struct</span> docdata_s <span class="comment">// Document formatting data</span>
{
<span class="comment">// State for the whole document</span>
pdfio_file_t *pdf; <span class="comment">// PDF file</span>
pdfio_rect_t media_box; <span class="comment">// Media (page) box</span>
pdfio_rect_t crop_box; <span class="comment">// Crop box (for margins)</span>
pdfio_rect_t art_box; <span class="comment">// Art box (for markdown content)</span>
pdfio_obj_t *fonts[DOCFONT_MAX]; <span class="comment">// Embedded fonts</span>
<span class="reserved">double</span> font_space; <span class="comment">// Unit width of a space</span>
size_t num_images; <span class="comment">// Number of embedded images</span>
docimage_t images[DOCIMAGE_MAX]; <span class="comment">// Embedded images</span>
<span class="reserved">const</span> <span class="reserved">char</span> *title; <span class="comment">// Document title</span>
<span class="reserved">char</span> *heading; <span class="comment">// Current document heading</span>
size_t num_actions; <span class="comment">// Number of actions for this document</span>
docaction_t actions[DOCACTION_MAX]; <span class="comment">// Actions for this document</span>
size_t num_targets; <span class="comment">// Number of targets for this document</span>
doctarget_t targets[DOCTARGET_MAX]; <span class="comment">// Targets for this document</span>
size_t num_toc; <span class="comment">// Number of table-of-contents entries</span>
doctoc_t toc[DOCTOC_MAX]; <span class="comment">// Table-of-contents entries</span>
<span class="comment">// State for the current page</span>
pdfio_stream_t *st; <span class="comment">// Current page stream</span>
<span class="reserved">double</span> y; <span class="comment">// Current position on page</span>
docfont_t font; <span class="comment">// Current font</span>
<span class="reserved">double</span> fsize; <span class="comment">// Current font size</span>
doccolor_t color; <span class="comment">// Current color</span>
pdfio_array_t *annots_array; <span class="comment">// Annotations array (for links)</span>
pdfio_obj_t *annots_obj; <span class="comment">// Annotations object (for links)</span>
size_t num_links; <span class="comment">// Number of links for this page</span>
doclink_t links[DOCLINK_MAX]; <span class="comment">// Links for this page</span>
} docdata_t;
</code></pre>
<h5 id="document-state">Document State</h5>
<p>The output is fixed to the &quot;universal&quot; media size (the intersection of US Letter and ISO A4) with 1/2 inch margins - the <code>PAGE_</code> constants can be changed to select a different size or margins. The <code>media_box</code> member contains the &quot;MediaBox&quot; rectangle for the PDF pages, while the <code>crop_box</code> and <code>art_box</code> members contain the &quot;CropBox&quot; and &quot;ArtBox&quot; values, respectively.</p>
<p>Four embedded fonts are used:</p>
<ul>
<li><p><code>DOCFONT_REGULAR</code>: the default font used for text,</p>
</li>
<li><p><code>DOCFONT_BOLD</code>: a boldface font used for headings and strong text,</p>
</li>
<li><p><code>DOCFONT_ITALIC</code>: an italic/oblique font used for emphasized text, and</p>
</li>
<li><p><code>DOCFONT_MONOSPACE</code>: a fixed-width font used for code.</p>
</li>
</ul>
<p>By default the code uses the base PostScript fonts Helvetica, Helvetica-Bold, Helvetica-Oblique, and Courier. The <code>USE_TRUETYPE</code> define can be used to replace these with the Roboto TrueType fonts.</p>
<p>Embedded JPEG and PNG images are copied into the PDF document, with the <code>images</code> array containing the list of the images and their objects.</p>
<p>The <code>title</code> member contains the document title, while the <code>heading</code> member contains the current heading text.</p>
<p>The <code>actions</code> array contains a list of action dictionaries for interior document links that need to be resolved, while the <code>targets</code> array keeps track of the location of the headings in the PDF document.</p>
<p>The <code>toc</code> array contains a list of headings and is used to construct the PDF outline dictionaries/objects, which provide a table of contents for navigation in most PDF readers.</p>
<h5 id="page-state">Page State</h5>
<p>The <code>st</code> member provides the stream for the current page content. The <code>color</code>, <code>font</code>, <code>fsize</code>, and <code>y</code> members provide the current graphics state on the page.</p>
<p>The <code>annots_array</code>, <code>annots_obj</code>, <code>num_links</code>, and <code>links</code> members contain a list of hyperlinks on the current page.</p>
<h4 id="creating-pages">Creating Pages</h4>
<p>The <code>new_page</code> function is used to start a new page. Aside from creating the new page object and stream, it adds a standard header and footer to the page. It starts by closing the current page if it is open:</p>
<pre><code class="language-c"><span class="comment">// Close the current page...</span>
<span class="reserved">if</span> (dd-&gt;st)
{
pdfioStreamClose(dd-&gt;st);
add_links(dd);
}
</code></pre>
<p>The new page needs a dictionary containing any link annotations, the media and art boxes, the four fonts, and any images:</p>
<pre><code class="language-c"><span class="comment">// Prep the new page...</span>
page_dict = pdfioDictCreate(dd-&gt;pdf);
dd-&gt;annots_array = pdfioArrayCreate(dd-&gt;pdf);
dd-&gt;annots_obj = pdfioFileCreateArrayObj(dd-&gt;pdf, dd-&gt;annots_array);
pdfioDictSetObj(page_dict, <span class="string">&quot;Annots&quot;</span>, dd-&gt;annots_obj);
pdfioDictSetRect(page_dict, <span class="string">&quot;MediaBox&quot;</span>, &amp;dd-&gt;media_box);
pdfioDictSetRect(page_dict, <span class="string">&quot;ArtBox&quot;</span>, &amp;dd-&gt;art_box);
<span class="reserved">for</span> (fontface = DOCFONT_REGULAR; fontface &lt; DOCFONT_MAX; fontface ++)
pdfioPageDictAddFont(page_dict, docfont_names[fontface], dd-&gt;fonts[fontface]);
<span class="reserved">for</span> (i = <span class="number">0</span>; i &lt; dd-&gt;num_images; i ++)
pdfioPageDictAddImage(page_dict, pdfioStringCreatef(dd-&gt;pdf, <span class="string">&quot;I%u&quot;</span>, (<span class="reserved">unsigned</span>)i),
dd-&gt;images[i].obj);
</code></pre>
<p>Once the page dictionary is initialized, we create a new page and initialize the current graphics state:</p>
<pre><code class="language-c">dd-&gt;st = pdfioFileCreatePage(dd-&gt;pdf, page_dict);
dd-&gt;color = DOCCOLOR_BLACK;
dd-&gt;font = DOCFONT_MAX;
dd-&gt;fsize = <span class="number">0.0</span>;
dd-&gt;y = dd-&gt;art_box.y2;
</code></pre>
<p>The header consists of a dark gray separating line and the document title. We don't show the header on the first page:</p>
<pre><code class="language-c"><span class="comment">// Add header/footer text</span>
set_color(dd, DOCCOLOR_GRAY);
set_font(dd, DOCFONT_REGULAR, SIZE_HEADFOOT);
<span class="reserved">if</span> (pdfioFileGetNumPages(dd-&gt;pdf) &gt; <span class="number">1</span> &amp;&amp; dd-&gt;title)
{
<span class="comment">// Show title in header...</span>
width = pdfioContentTextMeasure(dd-&gt;fonts[DOCFONT_REGULAR], dd-&gt;title,
SIZE_HEADFOOT);
pdfioContentTextBegin(dd-&gt;st);
pdfioContentTextMoveTo(dd-&gt;st,
dd-&gt;crop_box.x1 + <span class="number">0.5</span> * (dd-&gt;crop_box.x2 -
dd-&gt;crop_box.x1 - width),
dd-&gt;crop_box.y2 - SIZE_HEADFOOT);
pdfioContentTextShow(dd-&gt;st, UNICODE_VALUE, dd-&gt;title);
pdfioContentTextEnd(dd-&gt;st);
pdfioContentPathMoveTo(dd-&gt;st, dd-&gt;crop_box.x1,
dd-&gt;crop_box.y2 - <span class="number">2</span> * SIZE_HEADFOOT * LINE_HEIGHT +
SIZE_HEADFOOT);
pdfioContentPathLineTo(dd-&gt;st, dd-&gt;crop_box.x2,
dd-&gt;crop_box.y2 - <span class="number">2</span> * SIZE_HEADFOOT * LINE_HEIGHT +
SIZE_HEADFOOT);
pdfioContentStroke(dd-&gt;st);
}
</code></pre>
<p>The footer contains the same dark gray separating line with the current heading and page number on opposite sides. The page number is always positioned on the outer edge for a two-sided print - right justified on odd numbered pages and left justified on even numbered pages:</p>
<pre><code class="language-c"><span class="comment">// Show page number and current heading...</span>
pdfioContentPathMoveTo(dd-&gt;st, dd-&gt;crop_box.x1,
dd-&gt;crop_box.y1 + SIZE_HEADFOOT * LINE_HEIGHT);
pdfioContentPathLineTo(dd-&gt;st, dd-&gt;crop_box.x2,
dd-&gt;crop_box.y1 + SIZE_HEADFOOT * LINE_HEIGHT);
pdfioContentStroke(dd-&gt;st);
pdfioContentTextBegin(dd-&gt;st);
snprintf(temp, <span class="reserved">sizeof</span>(temp), <span class="string">&quot;%u&quot;</span>, (<span class="reserved">unsigned</span>)pdfioFileGetNumPages(dd-&gt;pdf));
<span class="reserved">if</span> (pdfioFileGetNumPages(dd-&gt;pdf) &amp; <span class="number">1</span>)
{
<span class="comment">// Page number on right...</span>
width = pdfioContentTextMeasure(dd-&gt;fonts[DOCFONT_REGULAR], temp, SIZE_HEADFOOT);
pdfioContentTextMoveTo(dd-&gt;st, dd-&gt;crop_box.x2 - width, dd-&gt;crop_box.y1);
}
<span class="reserved">else</span>
{
<span class="comment">// Page number on left...</span>
pdfioContentTextMoveTo(dd-&gt;st, dd-&gt;crop_box.x1, dd-&gt;crop_box.y1);
}
pdfioContentTextShow(dd-&gt;st, UNICODE_VALUE, temp);
pdfioContentTextEnd(dd-&gt;st);
<span class="reserved">if</span> (dd-&gt;heading)
{
pdfioContentTextBegin(dd-&gt;st);
<span class="reserved">if</span> (pdfioFileGetNumPages(dd-&gt;pdf) &amp; <span class="number">1</span>)
{
<span class="comment">// Current heading on left...</span>
pdfioContentTextMoveTo(dd-&gt;st, dd-&gt;crop_box.x1, dd-&gt;crop_box.y1);
}
<span class="reserved">else</span>
{
width = pdfioContentTextMeasure(dd-&gt;fonts[DOCFONT_REGULAR], dd-&gt;heading,
SIZE_HEADFOOT);
pdfioContentTextMoveTo(dd-&gt;st, dd-&gt;crop_box.x2 - width, dd-&gt;crop_box.y1);
}
pdfioContentTextShow(dd-&gt;st, UNICODE_VALUE, dd-&gt;heading);
pdfioContentTextEnd(dd-&gt;st);
}
</code></pre>
<h4 id="formatting-the-markdown-document">Formatting the Markdown Document</h4>
<p>Four functions handle the formatting of the markdown document:</p>
<ul>
<li><p><code>format_block</code>: formats a single paragraph, heading, list item, or table cell,</p>
</li>
<li><p><code>format_code</code>: formats a block of code,</p>
</li>
<li><p><code>format_doc</code>: formats the document as a whole, and</p>
</li>
<li><p><code>format_table</code>: formats a table.</p>
</li>
</ul>
<p>Formatted content is organized into arrays of <code>linefrag_t</code> and <code>tablerow_t</code> structures for a line of content or row of table cells, respectively.</p>
<h5 id="high-level-formatting">High-Level Formatting</h5>
<p>The <code>format_doc</code> function iterates over the block nodes in the markdown document. We map a &quot;thematic break&quot; (horizontal rule) to a page break, which is implemented by moving the current vertical position to the bottom of the page:</p>
<pre><code class="language-c"><span class="reserved">case</span> MMD_TYPE_THEMATIC_BREAK :
<span class="comment">// Force a page break</span>
dd-&gt;y = dd-&gt;art_box.y1;
<span class="reserved">break</span>;
</code></pre>
<p>A block quote is indented and uses the italic font by default:</p>
<pre><code class="language-c"><span class="reserved">case</span> MMD_TYPE_BLOCK_QUOTE :
format_doc(dd, current, DOCFONT_ITALIC, left + BQ_PADDING, right - BQ_PADDING);
<span class="reserved">break</span>;
</code></pre>
<p>Lists have a leading blank line and are indented:</p>
<pre><code class="language-c"><span class="reserved">case</span> MMD_TYPE_ORDERED_LIST :
<span class="reserved">case</span> MMD_TYPE_UNORDERED_LIST :
<span class="reserved">if</span> (dd-&gt;st)
dd-&gt;y -= SIZE_BODY * LINE_HEIGHT;
format_doc(dd, current, deffont, left + LIST_PADDING, right);
<span class="reserved">break</span>;
</code></pre>
<p>List items do not have a leading blank line and make use of leader text that is shown in front of the list text. The leader text is either the current item number or a bullet, which then is directly formatted using the <code>format_block</code> function:</p>
<pre><code class="language-c"><span class="reserved">case</span> MMD_TYPE_LIST_ITEM :
<span class="reserved">if</span> (doctype == MMD_TYPE_ORDERED_LIST)
{
snprintf(leader, <span class="reserved">sizeof</span>(leader), <span class="string">&quot;%d. &quot;</span>, i);
format_block(dd, current, deffont, SIZE_BODY, left, right, leader);
}
<span class="reserved">else</span>
{
format_block(dd, current, deffont, SIZE_BODY, left, right, <span class="comment">/*leader*/</span><span class="string">&quot;• &quot;</span>);
}
<span class="reserved">break</span>;
</code></pre>
<p>Paragraphs have a leading blank line and are likewise directly formatted:</p>
<pre><code class="language-c"><span class="reserved">case</span> MMD_TYPE_PARAGRAPH :
<span class="comment">// Add a blank line before the paragraph...</span>
dd-&gt;y -= SIZE_BODY * LINE_HEIGHT;
<span class="comment">// Format the paragraph...</span>
format_block(dd, current, deffont, SIZE_BODY, left, right, <span class="comment">/*leader*/</span>NULL);
<span class="reserved">break</span>;
</code></pre>
<p>Tables have a leading blank line and are formatted using the <code>format_table</code> function:</p>
<pre><code class="language-c"><span class="reserved">case</span> MMD_TYPE_TABLE :
<span class="comment">// Add a blank line before the table...</span>
dd-&gt;y -= SIZE_BODY * LINE_HEIGHT;
<span class="comment">// Format the table...</span>
format_table(dd, current, left, right);
<span class="reserved">break</span>;
</code></pre>
<p>Code blocks have a leading blank line, are indented slightly (to account for the padded background), and are formatted using the <code>format_code</code> function:</p>
<pre><code class="language-c"><span class="reserved">case</span> MMD_TYPE_CODE_BLOCK :
<span class="comment">// Add a blank line before the code block...</span>
dd-&gt;y -= SIZE_BODY * LINE_HEIGHT;
<span class="comment">// Format the code block...</span>
format_code(dd, current, left + CODE_PADDING, right - CODE_PADDING);
<span class="reserved">break</span>;
</code></pre>
<p>Headings get some extra processing. First, the current heading is remembered in the <code>docdata_t</code> structure so it can be used in the page footer:</p>
<pre><code class="language-c"><span class="reserved">case</span> MMD_TYPE_HEADING_1 :
<span class="reserved">case</span> MMD_TYPE_HEADING_2 :
<span class="reserved">case</span> MMD_TYPE_HEADING_3 :
<span class="reserved">case</span> MMD_TYPE_HEADING_4 :
<span class="reserved">case</span> MMD_TYPE_HEADING_5 :
<span class="reserved">case</span> MMD_TYPE_HEADING_6 :
<span class="comment">// Update the current heading</span>
free(dd-&gt;heading);
dd-&gt;heading = mmdCopyAllText(current);
</code></pre>
<p>Then we add a blank line and format the heading with the boldface font at a larger size using the <code>format_block</code> function:</p>
<pre><code class="language-c"> <span class="comment">// Add a blank line before the heading...</span>
dd-&gt;y -= heading_sizes[curtype - MMD_TYPE_HEADING_1] * LINE_HEIGHT;
<span class="comment">// Format the heading...</span>
format_block(dd, current, DOCFONT_BOLD,
heading_sizes[curtype - MMD_TYPE_HEADING_1], left, right,
<span class="comment">/*leader*/</span>NULL);
</code></pre>
<p>Once the heading is formatted, we record it in the <code>toc</code> array as a PDF outline item object/dictionary:</p>
<pre><code class="language-c"> <span class="comment">// Add the heading to the table-of-contents...</span>
<span class="reserved">if</span> (dd-&gt;num_toc &lt; DOCTOC_MAX)
{
doctoc_t *t = dd-&gt;toc + dd-&gt;num_toc;
<span class="comment">// New TOC</span>
pdfio_array_t *dest; <span class="comment">// Destination array</span>
t-&gt;level = curtype - MMD_TYPE_HEADING_1;
t-&gt;dict = pdfioDictCreate(dd-&gt;pdf);
t-&gt;obj = pdfioFileCreateObj(dd-&gt;pdf, t-&gt;dict);
dest = pdfioArrayCreate(dd-&gt;pdf);
pdfioArrayAppendObj(dest,
pdfioFileGetPage(dd-&gt;pdf, pdfioFileGetNumPages(dd-&gt;pdf) - <span class="number">1</span>));
pdfioArrayAppendName(dest, <span class="string">&quot;XYZ&quot;</span>);
pdfioArrayAppendNumber(dest, PAGE_LEFT);
pdfioArrayAppendNumber(dest,
dd-&gt;y + heading_sizes[curtype - MMD_TYPE_HEADING_1] * LINE_HEIGHT);
pdfioArrayAppendNumber(dest, <span class="number">0.0</span>);
pdfioDictSetArray(t-&gt;dict, <span class="string">&quot;Dest&quot;</span>, dest);
pdfioDictSetString(t-&gt;dict, <span class="string">&quot;Title&quot;</span>, pdfioStringCreate(dd-&gt;pdf, dd-&gt;heading));
dd-&gt;num_toc ++;
}
</code></pre>
<p>Finally, we also save the heading's target name and its location in the <code>targets</code> array to allow interior links to work:</p>
<pre><code class="language-c"> <span class="comment">// Add the heading to the list of link targets...</span>
<span class="reserved">if</span> (dd-&gt;num_targets &lt; DOCTARGET_MAX)
{
doctarget_t *t = dd-&gt;targets + dd-&gt;num_targets;
<span class="comment">// New target</span>
make_target_name(t-&gt;name, dd-&gt;heading, <span class="reserved">sizeof</span>(t-&gt;name));
t-&gt;page = pdfioFileGetNumPages(dd-&gt;pdf) - <span class="number">1</span>;
t-&gt;y = dd-&gt;y + heading_sizes[curtype - MMD_TYPE_HEADING_1] * LINE_HEIGHT;
dd-&gt;num_targets ++;
}
<span class="reserved">break</span>;
</code></pre>
<h5 id="formatting-paragraphs-headings-list-items-and-table-cells">Formatting Paragraphs, Headings, List Items, and Table Cells</h5>
<p>Paragraphs, headings, list items, and table cells all use the same basic formatting algorithm. Text, checkboxes, and images are collected until the nodes in the current block are used up or the content reaches the right margin.</p>
<p>In order to keep adjacent blocks of text together, the formatting algorithm makes sure that at least 3 lines of text can fit before the bottom edge of the page:</p>
<pre><code class="language-c"><span class="reserved">if</span> (mmdGetNextSibling(block))
need_bottom = <span class="number">3.0</span> * SIZE_BODY * LINE_HEIGHT;
<span class="reserved">else</span>
need_bottom = <span class="number">0.0</span>;
</code></pre>
<p>Leader text (used for list items) is right justified to the left margin and becomes the first fragment on the line when present.</p>
<pre><code class="language-c"><span class="reserved">if</span> (leader)
{
<span class="comment">// Add leader text on first line...</span>
frags[<span class="number">0</span>].type = MMD_TYPE_NORMAL_TEXT;
frags[<span class="number">0</span>].width = pdfioContentTextMeasure(dd-&gt;fonts[deffont], leader, fsize);
frags[<span class="number">0</span>].height = fsize;
frags[<span class="number">0</span>].x = left - frags[<span class="number">0</span>].width;
frags[<span class="number">0</span>].imagenum = <span class="number">0</span>;
frags[<span class="number">0</span>].text = leader;
frags[<span class="number">0</span>].url = NULL;
frags[<span class="number">0</span>].ws = <span class="reserved">false</span>;
frags[<span class="number">0</span>].font = deffont;
frags[<span class="number">0</span>].color = DOCCOLOR_BLACK;
num_frags = <span class="number">1</span>;
lineheight = fsize * LINE_HEIGHT;
}
<span class="reserved">else</span>
{
<span class="comment">// No leader text...</span>
num_frags = <span class="number">0</span>;
lineheight = <span class="number">0.0</span>;
}
frag = frags + num_frags;
</code></pre>
<p>If the current content fragment won't fit, we call <code>render_line</code> to draw what we have, adjusting the left margin as needed for table cells:</p>
<pre><code class="language-c"> <span class="comment">// See if this node will fit on the current line...</span>
<span class="reserved">if</span> ((num_frags &gt; <span class="number">0</span> &amp;&amp; (x + width + wswidth) &gt;= right) || num_frags == LINEFRAG_MAX)
{
<span class="comment">// No, render this line and start over...</span>
<span class="reserved">if</span> (blocktype == MMD_TYPE_TABLE_HEADER_CELL ||
blocktype == MMD_TYPE_TABLE_BODY_CELL_CENTER)
margin_left = <span class="number">0.5</span> * (right - x);
<span class="reserved">else</span> <span class="reserved">if</span> (blocktype == MMD_TYPE_TABLE_BODY_CELL_RIGHT)
margin_left = right - x;
<span class="reserved">else</span>
margin_left = <span class="number">0.0</span>;
render_line(dd, margin_left, need_bottom, lineheight, num_frags, frags);
num_frags = <span class="number">0</span>;
frag = frags;
x = left;
lineheight = <span class="number">0.0</span>;
need_bottom = <span class="number">0.0</span>;
</code></pre>
<p>Block quotes (blocks whose default font is italic) have an orange bar drawn to the left of the block:</p>
<pre><code class="language-c"> <span class="reserved">if</span> (deffont == DOCFONT_ITALIC)
{
<span class="comment">// Add an orange bar to the left of block quotes...</span>
set_color(dd, DOCCOLOR_ORANGE);
pdfioContentSave(dd-&gt;st);
pdfioContentSetLineWidth(dd-&gt;st, <span class="number">3.0</span>);
pdfioContentPathMoveTo(dd-&gt;st, left - <span class="number">6.0</span>, dd-&gt;y - (LINE_HEIGHT - <span class="number">1.0</span>) * fsize);
pdfioContentPathLineTo(dd-&gt;st, left - <span class="number">6.0</span>, dd-&gt;y + fsize);
pdfioContentStroke(dd-&gt;st);
pdfioContentRestore(dd-&gt;st);
}
</code></pre>
<p>Finally, we add the current content fragment to the array:</p>
<pre><code class="language-c"> <span class="comment">// Add the current node to the fragment list</span>
<span class="reserved">if</span> (num_frags == <span class="number">0</span>)
{
<span class="comment">// No leading whitespace at the start of the line</span>
ws = <span class="reserved">false</span>;
wswidth = <span class="number">0.0</span>;
}
frag-&gt;type = type;
frag-&gt;x = x;
frag-&gt;width = width + wswidth;
frag-&gt;height = text ? fsize : height;
frag-&gt;imagenum = imagenum;
frag-&gt;text = text;
frag-&gt;url = url;
frag-&gt;ws = ws;
frag-&gt;font = font;
frag-&gt;color = color;
num_frags ++;
frag ++;
x += width + wswidth;
<span class="reserved">if</span> (height &gt; lineheight)
lineheight = height;
</code></pre>
<h5 id="formatting-code-blocks">Formatting Code Blocks</h5>
<p>Code blocks consist of one or more lines of plain monospaced text. We draw a light gray background behind each line with a small bit of padding at the top and bottom:</p>
<pre><code class="language-c"><span class="comment">// Draw the top padding...</span>
set_color(dd, DOCCOLOR_LTGRAY);
pdfioContentPathRect(dd-&gt;st, left - CODE_PADDING, dd-&gt;y + SIZE_CODEBLOCK,
right - left + <span class="number">2.0</span> * CODE_PADDING, CODE_PADDING);
pdfioContentFillAndStroke(dd-&gt;st, <span class="reserved">false</span>);
<span class="comment">// Start a code text block...</span>
set_font(dd, DOCFONT_MONOSPACE, SIZE_CODEBLOCK);
pdfioContentTextBegin(dd-&gt;st);
pdfioContentTextMoveTo(dd-&gt;st, left, dd-&gt;y);
<span class="reserved">for</span> (code = mmdGetFirstChild(block); code; code = mmdGetNextSibling(code))
{
set_color(dd, DOCCOLOR_LTGRAY);
pdfioContentPathRect(dd-&gt;st, left - CODE_PADDING,
dd-&gt;y - (LINE_HEIGHT - <span class="number">1.0</span>) * SIZE_CODEBLOCK,
right - left + <span class="number">2.0</span> * CODE_PADDING, lineheight);
pdfioContentFillAndStroke(dd-&gt;st, <span class="reserved">false</span>);
set_color(dd, DOCCOLOR_RED);
pdfioContentTextShow(dd-&gt;st, UNICODE_VALUE, mmdGetText(code));
dd-&gt;y -= lineheight;
<span class="reserved">if</span> (dd-&gt;y &lt; dd-&gt;art_box.y1)
{
<span class="comment">// End the current text block...</span>
pdfioContentTextEnd(dd-&gt;st);
<span class="comment">// Start a new page...</span>
new_page(dd);
set_font(dd, DOCFONT_MONOSPACE, SIZE_CODEBLOCK);
dd-&gt;y -= lineheight;
pdfioContentTextBegin(dd-&gt;st);
pdfioContentTextMoveTo(dd-&gt;st, left, dd-&gt;y);
}
}
<span class="comment">// End the current text block...</span>
pdfioContentTextEnd(dd-&gt;st);
dd-&gt;y += lineheight;
<span class="comment">// Draw the bottom padding...</span>
set_color(dd, DOCCOLOR_LTGRAY);
pdfioContentPathRect(dd-&gt;st, left - CODE_PADDING,
dd-&gt;y - CODE_PADDING - (LINE_HEIGHT - <span class="number">1.0</span>) * SIZE_CODEBLOCK,
right - left + <span class="number">2.0</span> * CODE_PADDING, CODE_PADDING);
pdfioContentFillAndStroke(dd-&gt;st, <span class="reserved">false</span>);
</code></pre>
<h5 id="formatting-tables">Formatting Tables</h5>
<p>Tables are the most difficult to format. We start by scanning the entire table and measuring every cell with the <code>measure_cell</code> function:</p>
<pre><code class="language-c"><span class="reserved">for</span> (num_cols = <span class="number">0</span>, num_rows = <span class="number">0</span>, rowptr = rows, current = mmdGetFirstChild(table);
current &amp;&amp; num_rows &lt; TABLEROW_MAX;
current = next)
{
next = mmd_walk_next(table, current);
type = mmdGetType(current);
<span class="reserved">if</span> (type == MMD_TYPE_TABLE_ROW)
{
<span class="comment">// Parse row...</span>
<span class="reserved">for</span> (col = <span class="number">0</span>, current = mmdGetFirstChild(current);
current &amp;&amp; num_cols &lt; TABLECOL_MAX;
current = mmdGetNextSibling(current), col ++)
{
rowptr-&gt;cells[col] = current;
measure_cell(dd, current, cols + col);
<span class="reserved">if</span> (col &gt;= num_cols)
num_cols = col + <span class="number">1</span>;
}
rowptr ++;
num_rows ++;
}
}
</code></pre>
<p>The <code>measure_cell</code> function also updates the minimum and maximum width needed for each column. To this we add the cell padding to compute the total table width:</p>
<pre><code class="language-c"><span class="comment">// Figure out the width of each column...</span>
<span class="reserved">for</span> (col = <span class="number">0</span>, table_width = <span class="number">0.0</span>; col &lt; num_cols; col ++)
{
cols[col].max_width += <span class="number">2.0</span> * TABLE_PADDING;
table_width += cols[col].max_width;
cols[col].width = cols[col].max_width;
}
</code></pre>
<p>If the calculated width is more than the available width, we need to adjust the width of the columns. The algorithm used here breaks the available width into N equal-width columns - any columns wider than this will be scaled proportionately. This works out as two steps - one to calculate the base width of &quot;narrow&quot; columns and a second to distribute the remaining width amongst the wider columns:</p>
<pre><code class="language-c">format_width = right - left - <span class="number">2.0</span> * TABLE_PADDING * num_cols;
<span class="reserved">if</span> (table_width &gt; format_width)
{
<span class="comment">// Content too wide, try scaling the widths...</span>
<span class="reserved">double</span> avg_width, <span class="comment">// Average column width</span>
base_width, <span class="comment">// Base width</span>
remaining_width, <span class="comment">// Remaining width</span>
scale_width; <span class="comment">// Width for scaling</span>
size_t num_remaining_cols = <span class="number">0</span>; <span class="comment">// Number of remaining columns</span>
<span class="comment">// First mark any columns that are narrower than the average width...</span>
avg_width = format_width / num_cols;
<span class="reserved">for</span> (col = <span class="number">0</span>, base_width = <span class="number">0.0</span>, remaining_width = <span class="number">0.0</span>; col &lt; num_cols; col ++)
{
<span class="reserved">if</span> (cols[col].width &gt; avg_width)
{
remaining_width += cols[col].width;
num_remaining_cols ++;
}
<span class="reserved">else</span>
{
base_width += cols[col].width;
}
}
<span class="comment">// Then proportionately distribute the remaining width to the other columns...</span>
format_width -= base_width;
<span class="reserved">for</span> (col = <span class="number">0</span>, table_width = <span class="number">0.0</span>; col &lt; num_cols; col ++)
{
<span class="reserved">if</span> (cols[col].width &gt; avg_width)
cols[col].width = cols[col].width * format_width / remaining_width;
table_width += cols[col].width;
}
}
</code></pre>
<p>Now that we have the widths of the columns, we can calculate the left and right margins of each column for formatting the cell text:</p>
<pre><code class="language-c"><span class="comment">// Calculate the margins of each column in preparation for formatting</span>
<span class="reserved">for</span> (col = <span class="number">0</span>, x = left + TABLE_PADDING; col &lt; num_cols; col ++)
{
cols[col].left = x;
cols[col].right = x + cols[col].width;
x += cols[col].width + <span class="number">2.0</span> * TABLE_PADDING;
}
</code></pre>
<p>Then we re-measure the cells using the final column widths to determine the height of each cell and row:</p>
<pre><code class="language-c"><span class="comment">// Calculate the height of each row and cell in preparation for formatting</span>
<span class="reserved">for</span> (row = <span class="number">0</span>, rowptr = rows; row &lt; num_rows; row ++, rowptr ++)
{
<span class="reserved">for</span> (col = <span class="number">0</span>; col &lt; num_cols; col ++)
{
height = measure_cell(dd, rowptr-&gt;cells[col], cols + col) + <span class="number">2.0</span> * TABLE_PADDING;
<span class="reserved">if</span> (height &gt; rowptr-&gt;height)
rowptr-&gt;height = height;
}
}
</code></pre>
<p>Finally, we render each row in the table:</p>
<pre><code class="language-c"><span class="comment">// Render each table row...</span>
<span class="reserved">for</span> (row = <span class="number">0</span>, rowptr = rows; row &lt; num_rows; row ++, rowptr ++)
render_row(dd, num_cols, cols, rowptr);
</code></pre>
<h4 id="rendering-the-markdown-document">Rendering the Markdown Document</h4>
<p>The formatted content in arrays of <code>linefrag_t</code> and <code>tablerow_t</code> structures is passed to the <code>render_line</code> and <code>render_row</code> functions, respectively, to produce content in the PDF document.</p>
<h5 id="rendering-a-line-in-a-paragraph-heading-or-table-cell">Rendering a Line in a Paragraph, Heading, or Table Cell</h5>
<p>The <code>render_line</code> function adds content from the <code>linefrag_t</code> array to a PDF page. It starts by determining whether a new page is needed:</p>
<pre><code class="language-c"><span class="reserved">if</span> (!dd-&gt;st)
{
new_page(dd);
margin_top = <span class="number">0.0</span>;
}
dd-&gt;y -= margin_top + lineheight;
<span class="reserved">if</span> ((dd-&gt;y - need_bottom) &lt; dd-&gt;art_box.y1)
{
new_page(dd);
dd-&gt;y -= lineheight;
}
</code></pre>
<p>We then loop through the fragments for the current line, drawing checkboxes, images, and text as needed. When a hyperlink is present, we add the link to the <code>links</code> array in the <code>docdata_t</code> structure, mapping &quot;@&quot; and &quot;@@&quot; to an internal link corresponding to the linked text:</p>
<pre><code class="language-c"><span class="reserved">if</span> (frag-&gt;url &amp;&amp; dd-&gt;num_links &lt; DOCLINK_MAX)
{
doclink_t *l = dd-&gt;links + dd-&gt;num_links;
<span class="comment">// Pointer to this link record</span>
<span class="reserved">if</span> (!strcmp(frag-&gt;url, <span class="string">&quot;@&quot;</span>))
{
<span class="comment">// Use mapped text as link target...</span>
<span class="reserved">char</span> targetlink[<span class="number">129</span>]; <span class="comment">// Targeted link</span>
targetlink[<span class="number">0</span>] = <span class="string">'#'</span>;
make_target_name(targetlink + <span class="number">1</span>, frag-&gt;text, <span class="reserved">sizeof</span>(targetlink) - <span class="number">1</span>);
l-&gt;url = pdfioStringCreate(dd-&gt;pdf, targetlink);
}
<span class="reserved">else</span> <span class="reserved">if</span> (!strcmp(frag-&gt;url, <span class="string">&quot;@@&quot;</span>))
{
<span class="comment">// Use literal text as anchor...</span>
l-&gt;url = pdfioStringCreatef(dd-&gt;pdf, <span class="string">&quot;#%s&quot;</span>, frag-&gt;text);
}
<span class="reserved">else</span>
{
<span class="comment">// Use URL as-is...</span>
l-&gt;url = frag-&gt;url;
}
l-&gt;box.x1 = frag-&gt;x;
l-&gt;box.y1 = dd-&gt;y;
l-&gt;box.x2 = frag-&gt;x + frag-&gt;width;
l-&gt;box.y2 = dd-&gt;y + frag-&gt;height;
dd-&gt;num_links ++;
}
</code></pre>
<p>These are later written as annotations in the <code>add_links</code> function.</p>
<h5 id="rendering-a-table-row">Rendering a Table Row</h5>
<p>The <code>render_row</code> function takes a row of cells and the corresponding column definitions. It starts by drawing the border boxes around body cells:</p>
<pre><code class="language-c"><span class="reserved">if</span> (mmdGetType(row-&gt;cells[<span class="number">0</span>]) == MMD_TYPE_TABLE_HEADER_CELL)
{
<span class="comment">// Header row, no border...</span>
deffont = DOCFONT_BOLD;
}
<span class="reserved">else</span>
{
<span class="comment">// Regular body row, add borders...</span>
deffont = DOCFONT_REGULAR;
set_color(dd, DOCCOLOR_GRAY);
pdfioContentPathRect(dd-&gt;st, cols[<span class="number">0</span>].left - TABLE_PADDING, dd-&gt;y - row-&gt;height,
cols[num_cols - <span class="number">1</span>].right - cols[<span class="number">0</span>].left +
<span class="number">2.0</span> * TABLE_PADDING, row-&gt;height);
<span class="reserved">for</span> (col = <span class="number">1</span>; col &lt; num_cols; col ++)
{
pdfioContentPathMoveTo(dd-&gt;st, cols[col].left - TABLE_PADDING, dd-&gt;y);
pdfioContentPathLineTo(dd-&gt;st, cols[col].left - TABLE_PADDING, dd-&gt;y - row-&gt;height);
}
pdfioContentStroke(dd-&gt;st);
}
</code></pre>
<p>Then it formats each cell using the <code>format_block</code> function described previously. The page <code>y</code> value is reset before formatting each cell:</p>
<pre><code class="language-c">row_y = dd-&gt;y;
<span class="reserved">for</span> (col = <span class="number">0</span>; col &lt; num_cols; col ++)
{
dd-&gt;y = row_y;
format_block(dd, row-&gt;cells[col], deffont, SIZE_TABLE, cols[col].left,
cols[col].right, <span class="comment">/*leader*/</span>NULL);
}
dd-&gt;y = row_y - row-&gt;height;
</code></pre>
<h2 class="title"><a id="FUNCTIONS">Functions</a></h2> <h2 class="title"><a id="FUNCTIONS">Functions</a></h2>
<h3 class="function"><a id="pdfioArrayAppendArray">pdfioArrayAppendArray</a></h3> <h3 class="function"><a id="pdfioArrayAppendArray">pdfioArrayAppendArray</a></h3>
<p class="description">Add an array value to an array.</p> <p class="description">Add an array value to an array.</p>

View File

@ -1430,57 +1430,45 @@ structures for a line of content or row of table cells, respectively.
#### High-Level Formatting #### High-Level Formatting
The `format_doc` function iterates over the block nodes in the markdown
document. We map a "thematic break" (horizontal rule) to a page break, which
is implemented by moving the current vertical position to the bottom of the
page:
```c ```c
static void case MMD_TYPE_THEMATIC_BREAK :
format_doc(docdata_t *dd, // I - Document data
mmd_t *doc, // I - Document node to format
docfont_t deffont, // I - Default font
double left, // I - Left margin
double right) // I - Right margin
{
int i; // Child number
mmd_type_t doctype; // Document node type
mmd_t *current; // Current node
mmd_type_t curtype; // Current node type
char leader[32]; // Leader
static const double heading_sizes[] = // Heading font sizes
{
SIZE_HEADING_1,
SIZE_HEADING_2,
SIZE_HEADING_3,
SIZE_HEADING_4,
SIZE_HEADING_5,
SIZE_HEADING_6
};
doctype = mmdGetType(doc);
for (i = 1, current = mmdGetFirstChild(doc); current; i ++, current = mmdGetNextSibling(current))
{
switch (curtype = mmdGetType(current))
{
default :
break;
case MMD_TYPE_THEMATIC_BREAK :
// Force a page break // Force a page break
dd->y = dd->art_box.y1; dd->y = dd->art_box.y1;
break; break;
```
case MMD_TYPE_BLOCK_QUOTE : A block quote is indented and uses the italic font by default:
format_doc(dd, current, DOCFONT_ITALIC, left + 36.0, right - 36.0);
```c
case MMD_TYPE_BLOCK_QUOTE :
format_doc(dd, current, DOCFONT_ITALIC, left + BQ_PADDING, right - BQ_PADDING);
break; break;
```
case MMD_TYPE_ORDERED_LIST : Lists have a leading blank line and are indented:
case MMD_TYPE_UNORDERED_LIST :
```c
case MMD_TYPE_ORDERED_LIST :
case MMD_TYPE_UNORDERED_LIST :
if (dd->st) if (dd->st)
dd->y -= SIZE_BODY * LINE_HEIGHT; dd->y -= SIZE_BODY * LINE_HEIGHT;
format_doc(dd, current, deffont, left + 36.0, right); format_doc(dd, current, deffont, left + LIST_PADDING, right);
break; break;
```
case MMD_TYPE_LIST_ITEM : List items do not have a leading blank line and make use of leader text that is
shown in front of the list text. The leader text is either the current item
number or a bullet, which then is directly formatted using the `format_block`
function:
```c
case MMD_TYPE_LIST_ITEM :
if (doctype == MMD_TYPE_ORDERED_LIST) if (doctype == MMD_TYPE_ORDERED_LIST)
{ {
snprintf(leader, sizeof(leader), "%d. ", i); snprintf(leader, sizeof(leader), "%d. ", i);
@ -1491,19 +1479,79 @@ format_doc(docdata_t *dd, // I - Document data
format_block(dd, current, deffont, SIZE_BODY, left, right, /*leader*/"• "); format_block(dd, current, deffont, SIZE_BODY, left, right, /*leader*/"• ");
} }
break; break;
```
case MMD_TYPE_HEADING_1 : Paragraphs have a leading blank line and are likewise directly formatted:
case MMD_TYPE_HEADING_2 :
case MMD_TYPE_HEADING_3 : ```c
case MMD_TYPE_HEADING_4 : case MMD_TYPE_PARAGRAPH :
case MMD_TYPE_HEADING_5 : // Add a blank line before the paragraph...
case MMD_TYPE_HEADING_6 : dd->y -= SIZE_BODY * LINE_HEIGHT;
// Format the paragraph...
format_block(dd, current, deffont, SIZE_BODY, left, right, /*leader*/NULL);
break;
```
Tables have a leading blank line and are formatted using the `format_table`
function:
```c
case MMD_TYPE_TABLE :
// Add a blank line before the table...
dd->y -= SIZE_BODY * LINE_HEIGHT;
// Format the table...
format_table(dd, current, left, right);
break;
```
Code blocks have a leading blank line, are indented slightly (to account for the
padded background), and are formatted using the `format_code` function:
```c
case MMD_TYPE_CODE_BLOCK :
// Add a blank line before the code block...
dd->y -= SIZE_BODY * LINE_HEIGHT;
// Format the code block...
format_code(dd, current, left + CODE_PADDING, right - CODE_PADDING);
break;
```
Headings get some extra processing. First, the current heading is remembered in
the `docdata_t` structure so it can be used in the page footer:
```c
case MMD_TYPE_HEADING_1 :
case MMD_TYPE_HEADING_2 :
case MMD_TYPE_HEADING_3 :
case MMD_TYPE_HEADING_4 :
case MMD_TYPE_HEADING_5 :
case MMD_TYPE_HEADING_6 :
// Update the current heading
free(dd->heading); free(dd->heading);
dd->heading = mmdCopyAllText(current); dd->heading = mmdCopyAllText(current);
```
format_block(dd, current, DOCFONT_BOLD, heading_sizes[curtype - MMD_TYPE_HEADING_1], left, right, /*leader*/NULL); Then we add a blank line and format the heading with the boldface font at a
larger size using the `format_block` function:
```c
// Add a blank line before the heading...
dd->y -= heading_sizes[curtype - MMD_TYPE_HEADING_1] * LINE_HEIGHT;
// Format the heading...
format_block(dd, current, DOCFONT_BOLD,
heading_sizes[curtype - MMD_TYPE_HEADING_1], left, right,
/*leader*/NULL);
```
Once the heading is formatted, we record it in the `toc` array as a PDF outline
item object/dictionary:
```c
// Add the heading to the table-of-contents...
if (dd->num_toc < DOCTOC_MAX) if (dd->num_toc < DOCTOC_MAX)
{ {
doctoc_t *t = dd->toc + dd->num_toc; doctoc_t *t = dd->toc + dd->num_toc;
@ -1515,10 +1563,12 @@ format_doc(docdata_t *dd, // I - Document data
t->obj = pdfioFileCreateObj(dd->pdf, t->dict); t->obj = pdfioFileCreateObj(dd->pdf, t->dict);
dest = pdfioArrayCreate(dd->pdf); dest = pdfioArrayCreate(dd->pdf);
pdfioArrayAppendObj(dest, pdfioFileGetPage(dd->pdf, pdfioFileGetNumPages(dd->pdf) - 1)); pdfioArrayAppendObj(dest,
pdfioFileGetPage(dd->pdf, pdfioFileGetNumPages(dd->pdf) - 1));
pdfioArrayAppendName(dest, "XYZ"); pdfioArrayAppendName(dest, "XYZ");
pdfioArrayAppendNumber(dest, PAGE_LEFT); pdfioArrayAppendNumber(dest, PAGE_LEFT);
pdfioArrayAppendNumber(dest, dd->y + heading_sizes[curtype - MMD_TYPE_HEADING_1] * LINE_HEIGHT); pdfioArrayAppendNumber(dest,
dd->y + heading_sizes[curtype - MMD_TYPE_HEADING_1] * LINE_HEIGHT);
pdfioArrayAppendNumber(dest, 0.0); pdfioArrayAppendNumber(dest, 0.0);
pdfioDictSetArray(t->dict, "Dest", dest); pdfioDictSetArray(t->dict, "Dest", dest);
@ -1526,7 +1576,13 @@ format_doc(docdata_t *dd, // I - Document data
dd->num_toc ++; dd->num_toc ++;
} }
```
Finally, we also save the heading's target name and its location in the
`targets` array to allow interior links to work:
```c
// Add the heading to the list of link targets...
if (dd->num_targets < DOCTARGET_MAX) if (dd->num_targets < DOCTARGET_MAX)
{ {
doctarget_t *t = dd->targets + dd->num_targets; doctarget_t *t = dd->targets + dd->num_targets;
@ -1539,74 +1595,32 @@ format_doc(docdata_t *dd, // I - Document data
dd->num_targets ++; dd->num_targets ++;
} }
break; break;
case MMD_TYPE_PARAGRAPH :
format_block(dd, current, deffont, SIZE_BODY, left, right, /*leader*/NULL);
break;
case MMD_TYPE_TABLE :
format_table(dd, current, left, right);
break;
case MMD_TYPE_CODE_BLOCK :
format_code(dd, current, left + CODE_PADDING, right - CODE_PADDING);
break;
}
}
}
``` ```
#### Formatting Paragraphs, Headings, and Table Cells #### Formatting Paragraphs, Headings, List Items, and Table Cells
Paragraphs, headings, list items, and table cells all use the same basic
formatting algorithm. Text, checkboxes, and images are collected until the
nodes in the current block are used up or the content reaches the right margin.
In order to keep adjacent blocks of text together, the formatting algorithm
makes sure that at least 3 lines of text can fit before the bottom edge of the
page:
```c ```c
static void if (mmdGetNextSibling(block))
format_block(docdata_t *dd, // I - Document data
mmd_t *block, // I - Block to format
docfont_t deffont, // I - Default font
double fsize, // I - Size of font
double left, // I - Left margin
double right, // I - Right margin
const char *leader) // I - Leader text on the first line
{
mmd_type_t blocktype; // Block type
mmd_t *current, // Current node
*next; // Next node
size_t num_frags; // Number of line fragments
linefrag_t frags[LINEFRAG_MAX], // Line fragments
*frag; // Current fragment
mmd_type_t type; // Current node type
const char *text, // Current text
*url; // Current URL, if any
bool ws; // Current whitespace
pdfio_obj_t *image; // Current image, if any
size_t imagenum; // Current image number
doccolor_t color = DOCCOLOR_BLACK; // Current text color
docfont_t font = deffont; // Current text font
double x, // Current position
width, // Width of current fragment
wswidth, // Width of whitespace
margin_left, // Left margin
margin_top, // Top margin
need_bottom, // Space needed after this block
height, // Height of current fragment
lineheight; // Height of current line
blocktype = mmdGetType(block);
if ((blocktype >= MMD_TYPE_TABLE_HEADER_CELL && blocktype <= MMD_TYPE_TABLE_BODY_CELL_RIGHT) || blocktype == MMD_TYPE_LIST_ITEM)
margin_top = 0.0;
else
margin_top = fsize * LINE_HEIGHT;
if (mmdGetNextSibling(block))
need_bottom = 3.0 * SIZE_BODY * LINE_HEIGHT; need_bottom = 3.0 * SIZE_BODY * LINE_HEIGHT;
else else
need_bottom = 0.0; need_bottom = 0.0;
```
if (leader) Leader text (used for list items) is right justified to the left margin and
{ becomes the first fragment on the line when present.
```c
if (leader)
{
// Add leader text on first line... // Add leader text on first line...
frags[0].type = MMD_TYPE_NORMAL_TEXT; frags[0].type = MMD_TYPE_NORMAL_TEXT;
frags[0].width = pdfioContentTextMeasure(dd->fonts[deffont], leader, fsize); frags[0].width = pdfioContentTextMeasure(dd->fonts[deffont], leader, fsize);
@ -1621,131 +1635,46 @@ format_block(docdata_t *dd, // I - Document data
num_frags = 1; num_frags = 1;
lineheight = fsize * LINE_HEIGHT; lineheight = fsize * LINE_HEIGHT;
} }
else else
{ {
// No leader text... // No leader text...
num_frags = 0; num_frags = 0;
lineheight = 0.0; lineheight = 0.0;
} }
frag = frags + num_frags; frag = frags + num_frags;
```
// Loop through the block and render lines... If the current content fragment won't fit, we call `render_line` to draw what we
for (current = mmdGetFirstChild(block), x = left; current; current = next) have, adjusting the left margin as needed for table cells:
{
// Get information about the current node...
type = mmdGetType(current);
text = mmdGetText(current);
image = NULL;
imagenum = 0;
url = mmdGetURL(current);
ws = mmdGetWhitespace(current);
wswidth = ws ? dd->font_space * fsize : 0.0;
next = mmd_walk_next(block, current);
// Process the node...
if (type == MMD_TYPE_IMAGE && url)
{
// Embed an image
if ((image = find_image(dd, url, &imagenum)) == NULL)
continue;
// Image - treat as 100dpi
width = 72.0 * pdfioImageGetWidth(image) / IMAGE_PPI;
height = 72.0 * pdfioImageGetHeight(image) / IMAGE_PPI;
text = NULL;
if (width > (right - left))
{
// Too wide, scale to width...
width = right - left;
height = width * pdfioImageGetHeight(image) / pdfioImageGetWidth(image);
}
else if (height > (dd->art_box.y2 - dd->art_box.y1))
{
// Too tall, scale to height...
height = dd->art_box.y2 - dd->art_box.y1;
width = height * pdfioImageGetWidth(image) / pdfioImageGetHeight(image);
}
}
else if (type == MMD_TYPE_HARD_BREAK && num_frags > 0)
{
if (blocktype == MMD_TYPE_TABLE_HEADER_CELL || blocktype == MMD_TYPE_TABLE_BODY_CELL_CENTER)
margin_left = 0.5 * (right - x);
else if (blocktype == MMD_TYPE_TABLE_BODY_CELL_RIGHT)
margin_left = right - x;
else
margin_left = 0.0;
render_line(dd, margin_left, margin_top, need_bottom, lineheight, num_frags, frags);
if (deffont == DOCFONT_ITALIC)
{
// Add an orange bar to the left of block quotes...
set_color(dd, DOCCOLOR_ORANGE);
pdfioContentSave(dd->st);
pdfioContentSetLineWidth(dd->st, 3.0);
pdfioContentPathMoveTo(dd->st, left - 6.0, dd->y - (LINE_HEIGHT - 1.0) * fsize);
pdfioContentPathLineTo(dd->st, left - 6.0, dd->y + fsize);
pdfioContentStroke(dd->st);
pdfioContentRestore(dd->st);
}
num_frags = 0;
frag = frags;
x = left;
lineheight = 0.0;
margin_top = 0.0;
need_bottom = 0.0;
continue;
}
else if (type == MMD_TYPE_CHECKBOX)
{
// Checkbox
width = height = fsize;
}
else if (!text)
{
continue;
}
else
{
// Text fragment...
if (type == MMD_TYPE_EMPHASIZED_TEXT)
font = DOCFONT_ITALIC;
else if (type == MMD_TYPE_STRONG_TEXT)
font = DOCFONT_BOLD;
else if (type == MMD_TYPE_CODE_TEXT)
font = DOCFONT_MONOSPACE;
else
font = deffont;
if (type == MMD_TYPE_CODE_TEXT)
color = DOCCOLOR_RED;
else if (type == MMD_TYPE_LINKED_TEXT)
color = DOCCOLOR_BLUE;
else
color = DOCCOLOR_BLACK;
width = pdfioContentTextMeasure(dd->fonts[font], text, fsize);
height = fsize * LINE_HEIGHT;
}
```c
// See if this node will fit on the current line... // See if this node will fit on the current line...
if ((num_frags > 0 && (x + width + wswidth) >= right) || num_frags == LINEFRAG_MAX) if ((num_frags > 0 && (x + width + wswidth) >= right) || num_frags == LINEFRAG_MAX)
{ {
// No, render this line and start over... // No, render this line and start over...
if (blocktype == MMD_TYPE_TABLE_HEADER_CELL || blocktype == MMD_TYPE_TABLE_BODY_CELL_CENTER) if (blocktype == MMD_TYPE_TABLE_HEADER_CELL ||
blocktype == MMD_TYPE_TABLE_BODY_CELL_CENTER)
margin_left = 0.5 * (right - x); margin_left = 0.5 * (right - x);
else if (blocktype == MMD_TYPE_TABLE_BODY_CELL_RIGHT) else if (blocktype == MMD_TYPE_TABLE_BODY_CELL_RIGHT)
margin_left = right - x; margin_left = right - x;
else else
margin_left = 0.0; margin_left = 0.0;
render_line(dd, margin_left, margin_top, need_bottom, lineheight, num_frags, frags); render_line(dd, margin_left, need_bottom, lineheight, num_frags, frags);
num_frags = 0;
frag = frags;
x = left;
lineheight = 0.0;
need_bottom = 0.0;
```
Block quotes (blocks that use a default font of italic) have an orange bar to the
left of the block:
```c
if (deffont == DOCFONT_ITALIC) if (deffont == DOCFONT_ITALIC)
{ {
// Add an orange bar to the left of block quotes... // Add an orange bar to the left of block quotes...
@ -1757,18 +1686,15 @@ format_block(docdata_t *dd, // I - Document data
pdfioContentStroke(dd->st); pdfioContentStroke(dd->st);
pdfioContentRestore(dd->st); pdfioContentRestore(dd->st);
} }
```
num_frags = 0; Finally, we add the current content fragment to the array:
frag = frags;
x = left;
lineheight = 0.0;
margin_top = 0.0;
need_bottom = 0.0;
}
```c
// Add the current node to the fragment list // Add the current node to the fragment list
if (num_frags == 0) if (num_frags == 0)
{ {
// No leading whitespace at the start of the line
ws = false; ws = false;
wswidth = 0.0; wswidth = 0.0;
} }
@ -1789,84 +1715,33 @@ format_block(docdata_t *dd, // I - Document data
x += width + wswidth; x += width + wswidth;
if (height > lineheight) if (height > lineheight)
lineheight = height; lineheight = height;
}
if (num_frags > 0)
{
if (blocktype == MMD_TYPE_TABLE_HEADER_CELL || blocktype == MMD_TYPE_TABLE_BODY_CELL_CENTER)
margin_left = 0.5 * (right - x);
else if (blocktype == MMD_TYPE_TABLE_BODY_CELL_RIGHT)
margin_left = right - x;
else
margin_left = 0.0;
render_line(dd, margin_left, margin_top, need_bottom, lineheight, num_frags, frags);
if (deffont == DOCFONT_ITALIC)
{
// Add an orange bar to the left of block quotes...
set_color(dd, DOCCOLOR_ORANGE);
pdfioContentSave(dd->st);
pdfioContentSetLineWidth(dd->st, 3.0);
pdfioContentPathMoveTo(dd->st, left - 6.0, dd->y - (LINE_HEIGHT - 1.0) * fsize);
pdfioContentPathLineTo(dd->st, left - 6.0, dd->y + fsize);
pdfioContentStroke(dd->st);
pdfioContentRestore(dd->st);
}
}
}
``` ```
#### Formatting Code Blocks #### Formatting Code Blocks
Code blocks consist of one or more lines of plain monospaced text. We draw a
light gray background behind each line with a small bit of padding at the top
and bottom:
```c ```c
static void // Draw the top padding...
format_code(docdata_t *dd, // I - Document data set_color(dd, DOCCOLOR_LTGRAY);
mmd_t *block, // I - Code block pdfioContentPathRect(dd->st, left - CODE_PADDING, dd->y + SIZE_CODEBLOCK,
double left, // I - Left margin right - left + 2.0 * CODE_PADDING, CODE_PADDING);
double right) // I - Right margin pdfioContentFillAndStroke(dd->st, false);
// Start a code text block...
set_font(dd, DOCFONT_MONOSPACE, SIZE_CODEBLOCK);
pdfioContentTextBegin(dd->st);
pdfioContentTextMoveTo(dd->st, left, dd->y);
for (code = mmdGetFirstChild(block); code; code = mmdGetNextSibling(code))
{ {
mmd_t *code; // Current code block
double lineheight, // Line height
margin_top; // Top margin
// Compute line height and initial top margin...
lineheight = SIZE_CODEBLOCK * LINE_HEIGHT;
margin_top = lineheight;
// Start a new page as needed...
if (!dd->st)
{
new_page(dd);
margin_top = 0.0;
}
dd->y -= lineheight + margin_top + CODE_PADDING;
if ((dd->y - lineheight) < dd->art_box.y1)
{
new_page(dd);
dd->y -= lineheight + CODE_PADDING;
}
// Draw the top padding...
set_color(dd, DOCCOLOR_LTGRAY); set_color(dd, DOCCOLOR_LTGRAY);
pdfioContentPathRect(dd->st, left - CODE_PADDING, dd->y + SIZE_CODEBLOCK, right - left + 2.0 * CODE_PADDING, CODE_PADDING); pdfioContentPathRect(dd->st, left - CODE_PADDING,
pdfioContentFillAndStroke(dd->st, false); dd->y - (LINE_HEIGHT - 1.0) * SIZE_CODEBLOCK,
right - left + 2.0 * CODE_PADDING, lineheight);
// Start a code text block...
set_font(dd, DOCFONT_MONOSPACE, SIZE_CODEBLOCK);
pdfioContentTextBegin(dd->st);
pdfioContentTextMoveTo(dd->st, left, dd->y);
for (code = mmdGetFirstChild(block); code; code = mmdGetNextSibling(code))
{
set_color(dd, DOCCOLOR_LTGRAY);
pdfioContentPathRect(dd->st, left - CODE_PADDING, dd->y - (LINE_HEIGHT - 1.0) * SIZE_CODEBLOCK, right - left + 2.0 * CODE_PADDING, lineheight);
pdfioContentFillAndStroke(dd->st, false); pdfioContentFillAndStroke(dd->st, false);
set_color(dd, DOCCOLOR_RED); set_color(dd, DOCCOLOR_RED);
@ -1887,62 +1762,40 @@ format_code(docdata_t *dd, // I - Document data
pdfioContentTextBegin(dd->st); pdfioContentTextBegin(dd->st);
pdfioContentTextMoveTo(dd->st, left, dd->y); pdfioContentTextMoveTo(dd->st, left, dd->y);
} }
}
// End the current text block...
pdfioContentTextEnd(dd->st);
dd->y += lineheight;
// Draw the bottom padding...
set_color(dd, DOCCOLOR_LTGRAY);
pdfioContentPathRect(dd->st, left - CODE_PADDING, dd->y - CODE_PADDING - (LINE_HEIGHT - 1.0) * SIZE_CODEBLOCK, right - left + 2.0 * CODE_PADDING, CODE_PADDING);
pdfioContentFillAndStroke(dd->st, false);
} }
// End the current text block...
pdfioContentTextEnd(dd->st);
dd->y += lineheight;
// Draw the bottom padding...
set_color(dd, DOCCOLOR_LTGRAY);
pdfioContentPathRect(dd->st, left - CODE_PADDING,
dd->y - CODE_PADDING - (LINE_HEIGHT - 1.0) * SIZE_CODEBLOCK,
right - left + 2.0 * CODE_PADDING, CODE_PADDING);
pdfioContentFillAndStroke(dd->st, false);
``` ```
#### Formatting Tables #### Formatting Tables
Tables are the most difficult to format. We start by scanning the entire table
and measuring every cell with the `measure_cell` function:
```c ```c
static void for (num_cols = 0, num_rows = 0, rowptr = rows, current = mmdGetFirstChild(table);
format_table(docdata_t *dd, // I - Document data current && num_rows < TABLEROW_MAX;
mmd_t *table, // I - Table node current = next)
double left, // I - Left margin
double right) // I - Right margin
{ {
mmd_t *current, // Current node
*next; // Next node
mmd_type_t type; // Node type
size_t col, // Current column
num_cols; // Number of columns
tablecol_t cols[TABLECOL_MAX]; // Columns
size_t row, // Current row
num_rows; // Number of rows
tablerow_t rows[TABLEROW_MAX], // Rows
*rowptr; // Pointer to current row
double x, // Current X position
height, // Height of cell
format_width, // Maximum format width of table
table_width; // Total width of table
// Find all of the rows and columns in the table...
num_cols = num_rows = 0;
memset(cols, 0, sizeof(cols));
memset(rows, 0, sizeof(rows));
rowptr = rows;
for (current = mmdGetFirstChild(table); current && num_rows < TABLEROW_MAX; current = next)
{
next = mmd_walk_next(table, current); next = mmd_walk_next(table, current);
type = mmdGetType(current); type = mmdGetType(current);
if (type == MMD_TYPE_TABLE_ROW) if (type == MMD_TYPE_TABLE_ROW)
{ {
// Parse row... // Parse row...
for (col = 0, current = mmdGetFirstChild(current); current && num_cols < TABLECOL_MAX; current = mmdGetNextSibling(current), col ++) for (col = 0, current = mmdGetFirstChild(current);
current && num_cols < TABLECOL_MAX;
current = mmdGetNextSibling(current), col ++)
{ {
rowptr->cells[col] = current; rowptr->cells[col] = current;
@ -1955,21 +1808,36 @@ format_table(docdata_t *dd, // I - Document data
rowptr ++; rowptr ++;
num_rows ++; num_rows ++;
} }
} }
```
// Figure out the width of each column... The `measure_cell` function also updates the minimum and maximum width needed
for (col = 0, table_width = 0.0; col < num_cols; col ++) for each column. To this we add the cell padding to compute the total table
{ width:
```c
// Figure out the width of each column...
for (col = 0, table_width = 0.0; col < num_cols; col ++)
{
cols[col].max_width += 2.0 * TABLE_PADDING; cols[col].max_width += 2.0 * TABLE_PADDING;
table_width += cols[col].max_width; table_width += cols[col].max_width;
cols[col].width = cols[col].max_width; cols[col].width = cols[col].max_width;
} }
```
format_width = right - left - 2.0 * TABLE_PADDING * num_cols; If the calculated width is more than the available width, we need to adjust the
width of the columns. The algorithm used here breaks the available width into
N equal-width columns - any columns wider than this will be scaled
proportionately. This works out as two steps - one to calculate the base
width of "narrow" columns and a second to distribute the remaining width amongst
the wider columns:
if (table_width > format_width) ```c
{ format_width = right - left - 2.0 * TABLE_PADDING * num_cols;
if (table_width > format_width)
{
// Content too wide, try scaling the widths... // Content too wide, try scaling the widths...
double avg_width, // Average column width double avg_width, // Average column width
base_width, // Base width base_width, // Base width
@ -2003,37 +1871,48 @@ format_table(docdata_t *dd, // I - Document data
table_width += cols[col].width; table_width += cols[col].width;
} }
} }
```
// Calculate the margins of each column in preparation for formatting Now that we have the widths of the columns, we can calculate the left and right
for (col = 0, x = left + TABLE_PADDING; col < num_cols; col ++) margins of each column for formatting the cell text:
{
```c
// Calculate the margins of each column in preparation for formatting
for (col = 0, x = left + TABLE_PADDING; col < num_cols; col ++)
{
cols[col].left = x; cols[col].left = x;
cols[col].right = x + cols[col].width; cols[col].right = x + cols[col].width;
x += cols[col].width + 2.0 * TABLE_PADDING; x += cols[col].width + 2.0 * TABLE_PADDING;
} }
```
// Calculate the height of each row and cell in preparation for formatting Then we re-measure the cells using the final column widths to determine the
for (row = 0, rowptr = rows; row < num_rows; row ++, rowptr ++) height of each cell and row:
{
```c
// Calculate the height of each row and cell in preparation for formatting
for (row = 0, rowptr = rows; row < num_rows; row ++, rowptr ++)
{
for (col = 0; col < num_cols; col ++) for (col = 0; col < num_cols; col ++)
{ {
height = measure_cell(dd, rowptr->cells[col], cols + col) + 2.0 * TABLE_PADDING; height = measure_cell(dd, rowptr->cells[col], cols + col) + 2.0 * TABLE_PADDING;
if (height > rowptr->height) if (height > rowptr->height)
rowptr->height = height; rowptr->height = height;
} }
}
// Render each table row...
if (dd->st)
dd->y -= SIZE_TABLE * LINE_HEIGHT;
for (row = 0, rowptr = rows; row < num_rows; row ++, rowptr ++)
render_row(dd, num_cols, cols, rowptr);
} }
``` ```
Finally, we render each row in the table:
```c
// Render each table row...
for (row = 0, rowptr = rows; row < num_rows; row ++, rowptr ++)
render_row(dd, num_cols, cols, rowptr);
```
### Rendering the Markdown Document ### Rendering the Markdown Document
The formatted content in arrays of `linefrag_t` and `tablerow_t` structures The formatted content in arrays of `linefrag_t` and `tablerow_t` structures
@ -2109,9 +1988,34 @@ These are later written as annotations in the `add_links` function.
#### Rendering a Table Row #### Rendering a Table Row
The `render_row` function takes a row of cells and the corresponding column The `render_row` function takes a row of cells and the corresponding column
definitions, draws the border boxes around body cells, and then formats each definitions. It starts by drawing the border boxes around body cells:
cell using the `format_block` function described previously. The key is to
reset the page `y` value before formatting each cell: ```c
if (mmdGetType(row->cells[0]) == MMD_TYPE_TABLE_HEADER_CELL)
{
// Header row, no border...
deffont = DOCFONT_BOLD;
}
else
{
// Regular body row, add borders...
deffont = DOCFONT_REGULAR;
set_color(dd, DOCCOLOR_GRAY);
pdfioContentPathRect(dd->st, cols[0].left - TABLE_PADDING, dd->y - row->height,
cols[num_cols - 1].right - cols[0].left +
2.0 * TABLE_PADDING, row->height);
for (col = 1; col < num_cols; col ++)
{
pdfioContentPathMoveTo(dd->st, cols[col].left - TABLE_PADDING, dd->y);
pdfioContentPathLineTo(dd->st, cols[col].left - TABLE_PADDING, dd->y - row->height);
}
pdfioContentStroke(dd->st);
}
```
Then it formats each cell using the `format_block` function described
previously. The page `y` value is reset before formatting each cell:
```c ```c
row_y = dd->y; row_y = dd->y;
@ -2120,7 +2024,8 @@ for (col = 0; col < num_cols; col ++)
{ {
dd->y = row_y; dd->y = row_y;
format_block(dd, row->cells[col], deffont, SIZE_TABLE, cols[col].left, cols[col].right, /*leader*/NULL); format_block(dd, row->cells[col], deffont, SIZE_TABLE, cols[col].left,
cols[col].right, /*leader*/NULL);
} }
dd->y = row_y - row->height; dd->y = row_y - row->height;

View File

@ -218,6 +218,8 @@ static const char * const docfont_names[] =
#define LINE_HEIGHT 1.4 // Multiplier for line height #define LINE_HEIGHT 1.4 // Multiplier for line height
#define LIST_PADDING 36.0 // Padding/indentation for lists
#define SIZE_BODY 11.0 // Size of body text (points) #define SIZE_BODY 11.0 // Size of body text (points)
#define SIZE_CODEBLOCK 10.0 // Size of code block text (points) #define SIZE_CODEBLOCK 10.0 // Size of code block text (points)
#define SIZE_HEADFOOT 9.0 // Size of header/footer text (points) #define SIZE_HEADFOOT 9.0 // Size of header/footer text (points)
@ -260,7 +262,7 @@ static double measure_cell(docdata_t *dd, mmd_t *cell, tablecol_t *col);
static mmd_t *mmd_walk_next(mmd_t *top, mmd_t *node); static mmd_t *mmd_walk_next(mmd_t *top, mmd_t *node);
static void new_page(docdata_t *dd); static void new_page(docdata_t *dd);
static ssize_t output_cb(void *output_cbdata, const void *buffer, size_t bytes); static ssize_t output_cb(void *output_cbdata, const void *buffer, size_t bytes);
static void render_line(docdata_t *dd, double margin_left, double margin_top, double need_bottom, double lineheight, size_t num_frags, linefrag_t *frags); static void render_line(docdata_t *dd, double margin_left, double need_bottom, double lineheight, size_t num_frags, linefrag_t *frags);
static void render_row(docdata_t *dd, size_t num_cols, tablecol_t *cols, tablerow_t *row); static void render_row(docdata_t *dd, size_t num_cols, tablecol_t *cols, tablerow_t *row);
static void set_color(docdata_t *dd, doccolor_t color); static void set_color(docdata_t *dd, doccolor_t color);
static void set_font(docdata_t *dd, docfont_t font, double fsize); static void set_font(docdata_t *dd, docfont_t font, double fsize);
@ -578,7 +580,6 @@ format_block(docdata_t *dd, // I - Document data
width, // Width of current fragment width, // Width of current fragment
wswidth, // Width of whitespace wswidth, // Width of whitespace
margin_left, // Left margin margin_left, // Left margin
margin_top, // Top margin
need_bottom, // Space needed after this block need_bottom, // Space needed after this block
height, // Height of current fragment height, // Height of current fragment
lineheight; // Height of current line lineheight; // Height of current line
@ -586,11 +587,6 @@ format_block(docdata_t *dd, // I - Document data
blocktype = mmdGetType(block); blocktype = mmdGetType(block);
if ((blocktype >= MMD_TYPE_TABLE_HEADER_CELL && blocktype <= MMD_TYPE_TABLE_BODY_CELL_RIGHT) || blocktype == MMD_TYPE_LIST_ITEM)
margin_top = 0.0;
else
margin_top = fsize * LINE_HEIGHT;
if (mmdGetNextSibling(block)) if (mmdGetNextSibling(block))
need_bottom = 3.0 * SIZE_BODY * LINE_HEIGHT; need_bottom = 3.0 * SIZE_BODY * LINE_HEIGHT;
else else
@ -669,7 +665,7 @@ format_block(docdata_t *dd, // I - Document data
else else
margin_left = 0.0; margin_left = 0.0;
render_line(dd, margin_left, margin_top, need_bottom, lineheight, num_frags, frags); render_line(dd, margin_left, need_bottom, lineheight, num_frags, frags);
if (deffont == DOCFONT_ITALIC) if (deffont == DOCFONT_ITALIC)
{ {
@ -683,7 +679,6 @@ format_block(docdata_t *dd, // I - Document data
frag = frags; frag = frags;
x = left; x = left;
lineheight = 0.0; lineheight = 0.0;
margin_top = 0.0;
need_bottom = 0.0; need_bottom = 0.0;
continue; continue;
@ -731,7 +726,13 @@ format_block(docdata_t *dd, // I - Document data
else else
margin_left = 0.0; margin_left = 0.0;
render_line(dd, margin_left, margin_top, need_bottom, lineheight, num_frags, frags); render_line(dd, margin_left, need_bottom, lineheight, num_frags, frags);
num_frags = 0;
frag = frags;
x = left;
lineheight = 0.0;
need_bottom = 0.0;
if (deffont == DOCFONT_ITALIC) if (deffont == DOCFONT_ITALIC)
{ {
@ -744,18 +745,12 @@ format_block(docdata_t *dd, // I - Document data
pdfioContentStroke(dd->st); pdfioContentStroke(dd->st);
pdfioContentRestore(dd->st); pdfioContentRestore(dd->st);
} }
num_frags = 0;
frag = frags;
x = left;
lineheight = 0.0;
margin_top = 0.0;
need_bottom = 0.0;
} }
// Add the current node to the fragment list // Add the current node to the fragment list
if (num_frags == 0) if (num_frags == 0)
{ {
// No leading whitespace at the start of the line
ws = false; ws = false;
wswidth = 0.0; wswidth = 0.0;
} }
@ -787,7 +782,7 @@ format_block(docdata_t *dd, // I - Document data
else else
margin_left = 0.0; margin_left = 0.0;
render_line(dd, margin_left, margin_top, need_bottom, lineheight, num_frags, frags); render_line(dd, margin_left, need_bottom, lineheight, num_frags, frags);
if (deffont == DOCFONT_ITALIC) if (deffont == DOCFONT_ITALIC)
{ {
@ -815,23 +810,17 @@ format_code(docdata_t *dd, // I - Document data
double right) // I - Right margin double right) // I - Right margin
{ {
mmd_t *code; // Current code block mmd_t *code; // Current code block
double lineheight, // Line height double lineheight; // Line height
margin_top; // Top margin
// Compute line height and initial top margin... // Compute line height...
lineheight = SIZE_CODEBLOCK * LINE_HEIGHT; lineheight = SIZE_CODEBLOCK * LINE_HEIGHT;
margin_top = lineheight;
// Start a new page as needed... // Start a new page as needed...
if (!dd->st) if (!dd->st)
{
new_page(dd); new_page(dd);
margin_top = 0.0; dd->y -= lineheight + CODE_PADDING;
}
dd->y -= lineheight + margin_top + CODE_PADDING;
if ((dd->y - lineheight) < dd->art_box.y1) if ((dd->y - lineheight) < dd->art_box.y1)
{ {
@ -934,10 +923,9 @@ format_doc(docdata_t *dd, // I - Document data
case MMD_TYPE_ORDERED_LIST : case MMD_TYPE_ORDERED_LIST :
case MMD_TYPE_UNORDERED_LIST : case MMD_TYPE_UNORDERED_LIST :
if (dd->st)
dd->y -= SIZE_BODY * LINE_HEIGHT; dd->y -= SIZE_BODY * LINE_HEIGHT;
format_doc(dd, current, deffont, left + 36.0, right); format_doc(dd, current, deffont, left + LIST_PADDING, right);
break; break;
case MMD_TYPE_LIST_ITEM : case MMD_TYPE_LIST_ITEM :
@ -958,12 +946,17 @@ format_doc(docdata_t *dd, // I - Document data
case MMD_TYPE_HEADING_4 : case MMD_TYPE_HEADING_4 :
case MMD_TYPE_HEADING_5 : case MMD_TYPE_HEADING_5 :
case MMD_TYPE_HEADING_6 : case MMD_TYPE_HEADING_6 :
// Update the current heading
free(dd->heading); free(dd->heading);
dd->heading = mmdCopyAllText(current); dd->heading = mmdCopyAllText(current);
// Add a blank line before the heading...
dd->y -= heading_sizes[curtype - MMD_TYPE_HEADING_1] * LINE_HEIGHT;
// Format the heading...
format_block(dd, current, DOCFONT_BOLD, heading_sizes[curtype - MMD_TYPE_HEADING_1], left, right, /*leader*/NULL); format_block(dd, current, DOCFONT_BOLD, heading_sizes[curtype - MMD_TYPE_HEADING_1], left, right, /*leader*/NULL);
// Add the heading to the table-of-contents...
if (dd->num_toc < DOCTOC_MAX) if (dd->num_toc < DOCTOC_MAX)
{ {
doctoc_t *t = dd->toc + dd->num_toc; doctoc_t *t = dd->toc + dd->num_toc;
@ -987,6 +980,7 @@ format_doc(docdata_t *dd, // I - Document data
dd->num_toc ++; dd->num_toc ++;
} }
// Add the heading to the list of link targets...
if (dd->num_targets < DOCTARGET_MAX) if (dd->num_targets < DOCTARGET_MAX)
{ {
doctarget_t *t = dd->targets + dd->num_targets; doctarget_t *t = dd->targets + dd->num_targets;
@ -1001,14 +995,26 @@ format_doc(docdata_t *dd, // I - Document data
break; break;
case MMD_TYPE_PARAGRAPH : case MMD_TYPE_PARAGRAPH :
// Add a blank line before the paragraph...
dd->y -= SIZE_BODY * LINE_HEIGHT;
// Format the paragraph...
format_block(dd, current, deffont, SIZE_BODY, left, right, /*leader*/NULL); format_block(dd, current, deffont, SIZE_BODY, left, right, /*leader*/NULL);
break; break;
case MMD_TYPE_TABLE : case MMD_TYPE_TABLE :
// Add a blank line before the table...
dd->y -= SIZE_BODY * LINE_HEIGHT;
// Format the table...
format_table(dd, current, left, right); format_table(dd, current, left, right);
break; break;
case MMD_TYPE_CODE_BLOCK : case MMD_TYPE_CODE_BLOCK :
// Add a blank line before the code block...
dd->y -= SIZE_BODY * LINE_HEIGHT;
// Format the code block...
format_code(dd, current, left + CODE_PADDING, right - CODE_PADDING); format_code(dd, current, left + CODE_PADDING, right - CODE_PADDING);
break; break;
} }
@ -1043,14 +1049,10 @@ format_table(docdata_t *dd, // I - Document data
// Find all of the rows and columns in the table... // Find all of the rows and columns in the table...
num_cols = num_rows = 0;
memset(cols, 0, sizeof(cols)); memset(cols, 0, sizeof(cols));
memset(rows, 0, sizeof(rows)); memset(rows, 0, sizeof(rows));
rowptr = rows; for (num_cols = 0, num_rows = 0, rowptr = rows, current = mmdGetFirstChild(table); current && num_rows < TABLEROW_MAX; current = next)
for (current = mmdGetFirstChild(table); current && num_rows < TABLEROW_MAX; current = next)
{ {
next = mmd_walk_next(table, current); next = mmd_walk_next(table, current);
type = mmdGetType(current); type = mmdGetType(current);
@ -1142,9 +1144,6 @@ format_table(docdata_t *dd, // I - Document data
} }
// Render each table row... // Render each table row...
if (dd->st)
dd->y -= SIZE_TABLE * LINE_HEIGHT;
for (row = 0, rowptr = rows; row < num_rows; row ++, rowptr ++) for (row = 0, rowptr = rows; row < num_rows; row ++, rowptr ++)
render_row(dd, num_cols, cols, rowptr); render_row(dd, num_cols, cols, rowptr);
} }
@ -1471,7 +1470,6 @@ output_cb(void *output_cbdata, // I - Callback data (not used)
static void static void
render_line(docdata_t *dd, // I - Document data render_line(docdata_t *dd, // I - Document data
double margin_left, // I - Left margin double margin_left, // I - Left margin
double margin_top, // I - Top margin
double need_bottom, // I - How much space is needed after double need_bottom, // I - How much space is needed after
double lineheight, // I - Height of line double lineheight, // I - Height of line
size_t num_frags, // I - Number of line fragments size_t num_frags, // I - Number of line fragments
@ -1483,12 +1481,9 @@ render_line(docdata_t *dd, // I - Document data
if (!dd->st) if (!dd->st)
{
new_page(dd); new_page(dd);
margin_top = 0.0;
}
dd->y -= margin_top + lineheight; dd->y -= lineheight;
if ((dd->y - need_bottom) < dd->art_box.y1) if ((dd->y - need_bottom) < dd->art_box.y1)
{ {
new_page(dd); new_page(dd);