#include "mupdf/html.h"

/*
 * Indices into fz_html::page_margin as used by htdoc_bound_page below.
 * NOTE(review): presumably Top, Right, Bottom, Left -- confirm against the
 * definition of page_margin.
 */
enum { T, R, B, L };

typedef struct html_document_s html_document;
typedef struct html_page_s html_page;

/* A stand-alone (X)HTML file exposed through the fz_document interface. */
struct html_document_s
{
	fz_document super;
	fz_archive *zip;		/* archive passed to fz_parse_html alongside the markup */
	fz_html_font_set *set;	/* font set passed to fz_parse_html */
	fz_html *html;			/* parsed document; laid out by htdoc_layout */
};

/* One page of the laid-out document. */
struct html_page_s
{
	fz_page super;
	html_document *doc;		/* owning document (no reference is taken here) */
	int number;				/* page number as passed to htdoc_load_page */
};

/*
 * drop_document callback: release everything the document owns.
 *
 * May be reached with a partially constructed document from the error path
 * of the open functions, in which case some members are still NULL.
 * NOTE(review): relies on the MuPDF convention that drop functions accept
 * NULL -- confirm for fz_drop_html_font_set in this tree.
 */
static void
htdoc_drop_document(fz_context *ctx, fz_document *doc_)
{
	html_document *doc = (html_document*)doc_;
	fz_drop_archive(ctx, doc->zip);
	fz_drop_html(ctx, doc->html);
	fz_drop_html_font_set(ctx, doc->set);
}

/*
 * resolve_link callback.
 *
 * If dest contains a '#' followed by a non-empty fragment, the fragment is
 * looked up with fz_find_html_target. When that yields a non-negative y
 * offset, the page number (y divided by the page height, truncated) is
 * returned and, if yp is non-NULL, *yp receives the offset within that
 * page. In every other case -1 is returned. *xp is never written.
 */
static int
htdoc_resolve_link(fz_context *ctx, fz_document *doc_, const char *dest, float *xp, float *yp)
{
	html_document *doc = (html_document*)doc_;
	const char *s = strchr(dest, '#');
	if (s && s[1] != 0)
	{
		float y = fz_find_html_target(ctx, doc->html, s+1);
		if (y >= 0)
		{
			int page = y / doc->html->page_h;
			if (yp) *yp = y - page * doc->html->page_h;
			return page;
		}
	}
	return -1;
}

/* count_pages callback: height of the root box divided by the page height, rounded up. */
static int
htdoc_count_pages(fz_context *ctx, fz_document *doc_)
{
	html_document *doc = (html_document*)doc_;
	int count = ceilf(doc->html->root->h / doc->html->page_h);
	return count;
}

/* layout callback: forward the requested page size and em size to fz_layout_html. */
static void
htdoc_layout(fz_context *ctx, fz_document *doc_, float w, float h, float em)
{
	html_document *doc = (html_document*)doc_;
	fz_layout_html(ctx, doc->html, w, h, em);
}

/* drop_page callback: html_page owns nothing beyond its own storage. */
static void
htdoc_drop_page(fz_context *ctx, fz_page *page_)
{
}

/*
 * bound_page callback: the page box starts at the origin and spans the
 * content width/height plus the margins on both sides. Returns bbox.
 */
static fz_rect *
htdoc_bound_page(fz_context *ctx, fz_page *page_, fz_rect *bbox)
{
	html_page *page = (html_page*)page_;
	html_document *doc = page->doc;
	bbox->x0 = 0;
	bbox->y0 = 0;
	bbox->x1 = doc->html->page_w + doc->html->page_margin[L] + doc->html->page_margin[R];
	bbox->y1 = doc->html->page_h + doc->html->page_margin[T] + doc->html->page_margin[B];
	return bbox;
}

/* run_page_contents callback: draw this page's slice of the document. The cookie is unused. */
static void
htdoc_run_page(fz_context *ctx, fz_page *page_, fz_device *dev, const fz_matrix *ctm, fz_cookie *cookie)
{
	html_page *page = (html_page*)page_;
	html_document *doc = page->doc;
	fz_draw_html(ctx, dev, ctm, doc->html, page->number);
}

/* load_links callback: collect the links on this page, using an empty file name. */
static fz_link *
htdoc_load_links(fz_context *ctx, fz_page *page_)
{
	html_page *page = (html_page*)page_;
	html_document *doc = page->doc;
	return fz_load_html_links(ctx, doc->html, page->number, "", doc);
}

/* make_bookmark callback: delegate to fz_make_html_bookmark. */
static fz_bookmark
htdoc_make_bookmark(fz_context *ctx, fz_document *doc_, int page)
{
	html_document *doc = (html_document*)doc_;
	return fz_make_html_bookmark(ctx, doc->html, page);
}

/* lookup_bookmark callback: delegate to fz_lookup_html_bookmark. */
static int
htdoc_lookup_bookmark(fz_context *ctx, fz_document *doc_, fz_bookmark mark)
{
	html_document *doc = (html_document*)doc_;
	return fz_lookup_html_bookmark(ctx, doc->html, mark);
}

/* load_page callback: create a page object that records its document and number. */
static fz_page *
htdoc_load_page(fz_context *ctx, fz_document *doc_, int number)
{
	html_document *doc = (html_document*)doc_;
	html_page *page = fz_new_derived_page(ctx, html_page);
	page->super.bound_page = htdoc_bound_page;
	page->super.run_page_contents = htdoc_run_page;
	page->super.load_links = htdoc_load_links;
	page->super.drop_page = htdoc_drop_page;
	page->doc = doc;
	page->number = number;
	return (fz_page*)page;
}

/*
 * lookup_metadata callback: only the "format" key is known; it yields
 * "XHTML" and returns the result of fz_strlcpy. Any other key returns -1.
 */
static int
htdoc_lookup_metadata(fz_context *ctx, fz_document *doc_, const char *key, char *buf, int size)
{
	if (!strcmp(key, "format"))
		return (int)fz_strlcpy(buf, "XHTML", size);
	return -1;
}

/*
 * Allocate an html_document and install the full callback table.
 *
 * Both open functions share this so that they always expose the same set
 * of callbacks (including the bookmark pair). The owned pointers are
 * cleared explicitly so htdoc_drop_document can run on a document whose
 * construction failed part-way.
 */
static html_document *
htdoc_new_document(fz_context *ctx)
{
	html_document *doc = fz_new_derived_document(ctx, html_document);

	doc->super.drop_document = htdoc_drop_document;
	doc->super.layout = htdoc_layout;
	doc->super.resolve_link = htdoc_resolve_link;
	doc->super.make_bookmark = htdoc_make_bookmark;
	doc->super.lookup_bookmark = htdoc_lookup_bookmark;
	doc->super.count_pages = htdoc_count_pages;
	doc->super.load_page = htdoc_load_page;
	doc->super.lookup_metadata = htdoc_lookup_metadata;
	doc->super.is_reflowable = 1;

	doc->zip = NULL;
	doc->set = NULL;
	doc->html = NULL;

	return doc;
}

/*
 * Open a document from a stream. Resources referenced by the markup are
 * looked up relative to the current directory (".").
 *
 * Throws on failure; the partially built document is dropped first so
 * nothing is leaked.
 */
static fz_document *
htdoc_open_document_with_stream(fz_context *ctx, fz_stream *file)
{
	html_document *doc = htdoc_new_document(ctx);
	fz_buffer *buf = NULL;

	/* buf is assigned inside fz_try and read in fz_always. */
	fz_var(buf);

	fz_try(ctx)
	{
		doc->zip = fz_open_directory(ctx, ".");
		doc->set = fz_new_html_font_set(ctx);
		buf = fz_read_all(ctx, file, 0);
		doc->html = fz_parse_html(ctx, doc->set, doc->zip, ".", buf, fz_user_css(ctx));
	}
	fz_always(ctx)
	{
		fz_drop_buffer(ctx, buf);
	}
	fz_catch(ctx)
	{
		fz_drop_document(ctx, &doc->super);
		fz_rethrow(ctx);
	}

	return (fz_document*)doc;
}

/*
 * Open a document from a file name. Resources referenced by the markup are
 * looked up relative to the directory containing the file.
 *
 * Throws on failure; the partially built document is dropped first so
 * nothing is leaked.
 */
static fz_document *
htdoc_open_document(fz_context *ctx, const char *filename)
{
	char dirname[2048];
	html_document *doc;
	fz_buffer *buf = NULL;

	fz_dirname(dirname, filename, sizeof dirname);

	doc = htdoc_new_document(ctx);

	/* buf is assigned inside fz_try and read in fz_always. */
	fz_var(buf);

	fz_try(ctx)
	{
		doc->zip = fz_open_directory(ctx, dirname);
		doc->set = fz_new_html_font_set(ctx);
		buf = fz_read_file(ctx, filename);
		doc->html = fz_parse_html(ctx, doc->set, doc->zip, ".", buf, fz_user_css(ctx));
	}
	fz_always(ctx)
	{
		fz_drop_buffer(ctx, buf);
	}
	fz_catch(ctx)
	{
		fz_drop_document(ctx, &doc->super);
		fz_rethrow(ctx);
	}

	return (fz_document*)doc;
}

/*
 * Handler recognition callback.
 *
 * magic is either a file name or a MIME type. Returns 100 when its
 * extension (compared case-insensitively) or its exact MIME string is one
 * this handler claims, 0 otherwise.
 */
static int
htdoc_recognize(fz_context *ctx, const char *magic)
{
	const char *ext = strrchr(magic, '.');

	if (ext)
	{
		if (!fz_strcasecmp(ext, ".xml") ||
			!fz_strcasecmp(ext, ".xhtml") ||
			!fz_strcasecmp(ext, ".html") ||
			!fz_strcasecmp(ext, ".htm") ||
			!fz_strcasecmp(ext, ".fb2"))
			return 100;
	}

	/*
	 * "application/xhtml+xml" is the registered XHTML media type;
	 * "application/html+xml" is kept for backward compatibility.
	 */
	if (!strcmp(magic, "application/html+xml") ||
		!strcmp(magic, "application/xhtml+xml") ||
		!strcmp(magic, "application/xml") ||
		!strcmp(magic, "text/xml"))
		return 100;

	return 0;
}

/* Handler table: recognize, open by file name, open by stream (positional). */
fz_document_handler html_document_handler =
{
	&htdoc_recognize,
	&htdoc_open_document,
	&htdoc_open_document_with_stream
};