#include "mupdf/html.h" enum { T, R, B, L }; typedef struct html_document_s html_document; typedef struct html_page_s html_page; struct html_document_s { fz_document super; fz_archive *zip; fz_html_font_set *set; float page_w, page_h, em; float page_margin[4]; fz_html *box; }; struct html_page_s { fz_page super; html_document *doc; int number; }; static void htdoc_close_document(fz_context *ctx, fz_document *doc_) { html_document *doc = (html_document*)doc_; fz_drop_archive(ctx, doc->zip); fz_drop_html(ctx, doc->box); fz_drop_html_font_set(ctx, doc->set); fz_free(ctx, doc); } static int htdoc_count_pages(fz_context *ctx, fz_document *doc_) { html_document *doc = (html_document*)doc_; int count = ceilf(doc->box->h / doc->page_h); return count; } static void htdoc_layout(fz_context *ctx, fz_document *doc_, float w, float h, float em) { html_document *doc = (html_document*)doc_; if (doc->box) { doc->page_margin[T] = fz_from_css_number(doc->box->style.margin[T], em, em); doc->page_margin[B] = fz_from_css_number(doc->box->style.margin[B], em, em); doc->page_margin[L] = fz_from_css_number(doc->box->style.margin[L], em, em); doc->page_margin[R] = fz_from_css_number(doc->box->style.margin[R], em, em); } doc->page_w = w - doc->page_margin[L] - doc->page_margin[R]; doc->page_h = h - doc->page_margin[T] - doc->page_margin[B]; doc->em = em; fz_layout_html(ctx, doc->box, doc->page_w, doc->page_h, doc->em); } static void htdoc_drop_page_imp(fz_context *ctx, fz_page *page_) { } static fz_rect * htdoc_bound_page(fz_context *ctx, fz_page *page_, fz_rect *bbox) { html_page *page = (html_page*)page_; html_document *doc = page->doc; bbox->x0 = 0; bbox->y0 = 0; bbox->x1 = doc->page_w + doc->page_margin[L] + doc->page_margin[R]; bbox->y1 = doc->page_h + doc->page_margin[T] + doc->page_margin[B]; return bbox; } static void htdoc_run_page(fz_context *ctx, fz_page *page_, fz_device *dev, const fz_matrix *ctm, fz_cookie *cookie) { html_page *page = (html_page*)page_; html_document *doc = page->doc; fz_matrix local_ctm = *ctm; int n = page->number; fz_pre_translate(&local_ctm, doc->page_margin[L], doc->page_margin[T]); fz_draw_html(ctx, doc->box, n * doc->page_h, (n+1) * doc->page_h, dev, &local_ctm); } static fz_page * htdoc_load_page(fz_context *ctx, fz_document *doc_, int number) { html_document *doc = (html_document*)doc_; html_page *page = fz_new_page(ctx, sizeof *page); page->super.bound_page = htdoc_bound_page; page->super.run_page_contents = htdoc_run_page; page->super.drop_page_imp = htdoc_drop_page_imp; page->doc = doc; page->number = number; return (fz_page*)page; } static fz_document * htdoc_open_document_with_stream(fz_context *ctx, fz_stream *file) { html_document *doc; fz_buffer *buf; doc = fz_malloc_struct(ctx, html_document); doc->super.close = htdoc_close_document; doc->super.layout = htdoc_layout; doc->super.count_pages = htdoc_count_pages; doc->super.load_page = htdoc_load_page; doc->zip = fz_open_directory(ctx, "."); doc->set = fz_new_html_font_set(ctx); buf = fz_read_all(ctx, file, 0); fz_write_buffer_byte(ctx, buf, 0); doc->box = fz_parse_html(ctx, doc->set, doc->zip, ".", buf, fz_user_css(ctx)); fz_drop_buffer(ctx, buf); return (fz_document*)doc; } static fz_document * htdoc_open_document(fz_context *ctx, const char *filename) { char dirname[2048]; fz_buffer *buf; html_document *doc; fz_dirname(dirname, filename, sizeof dirname); doc = fz_malloc_struct(ctx, html_document); doc->super.close = htdoc_close_document; doc->super.layout = htdoc_layout; doc->super.count_pages = htdoc_count_pages; doc->super.load_page = htdoc_load_page; doc->zip = fz_open_directory(ctx, dirname); doc->set = fz_new_html_font_set(ctx); buf = fz_read_file(ctx, filename); fz_write_buffer_byte(ctx, buf, 0); doc->box = fz_parse_html(ctx, doc->set, doc->zip, ".", buf, fz_user_css(ctx)); fz_drop_buffer(ctx, buf); return (fz_document*)doc; } static int htdoc_recognize(fz_context *doc, const char *magic) { char *ext = strrchr(magic, '.'); if (ext) { if (!fz_strcasecmp(ext, ".xml") || !fz_strcasecmp(ext, ".xhtml") || !fz_strcasecmp(ext, ".html") || !fz_strcasecmp(ext, ".htm")) return 100; } if (!strcmp(magic, "application/html+xml") || !strcmp(magic, "application/xml") || !strcmp(magic, "text/xml")) return 100; return 0; } fz_document_handler html_document_handler = { &htdoc_recognize, &htdoc_open_document, &htdoc_open_document_with_stream };