diff options
author | Tor Andersson <tor.andersson@artifex.com> | 2015-02-23 15:00:56 +0100 |
---|---|---|
committer | Tor Andersson <tor.andersson@artifex.com> | 2015-02-23 15:00:56 +0100 |
commit | 119552f74c71c24698f4b424411786bfb4baea6b (patch) | |
tree | bf312c79c7fe6fcb819c6f1b8e3cc9f8e4888e0e /source/html/html-doc.c | |
parent | 241f8b6c35895b932ac7f27de1ee76416cae419a (diff) | |
parent | fe05bc51ee70190516d6cc65f03e343bfdc4f849 (diff) | |
download | mupdf-119552f74c71c24698f4b424411786bfb4baea6b.tar.xz |
Merge branch 'html'
Conflicts:
Makefile
Diffstat (limited to 'source/html/html-doc.c')
-rw-r--r-- | source/html/html-doc.c | 166 |
1 files changed, 166 insertions, 0 deletions
diff --git a/source/html/html-doc.c b/source/html/html-doc.c new file mode 100644 index 00000000..7217f74c --- /dev/null +++ b/source/html/html-doc.c @@ -0,0 +1,166 @@ +#include "mupdf/html.h" + +#define DEFW (450) +#define DEFH (600) +#define DEFEM (12) + +typedef struct html_document_s html_document; +typedef struct html_page_s html_page; + +struct html_document_s +{ + fz_document super; + fz_archive *zip; + fz_html_font_set *set; + float page_w, page_h, em; + fz_html *box; +}; + +struct html_page_s +{ + fz_page super; + html_document *doc; + int number; +}; + +static void +htdoc_close_document(fz_context *ctx, fz_document *doc_) +{ + html_document *doc = (html_document*)doc_; + fz_drop_archive(ctx, doc->zip); + fz_drop_html(ctx, doc->box); + fz_drop_html_font_set(ctx, doc->set); + fz_free(ctx, doc); +} + +static int +htdoc_count_pages(fz_context *ctx, fz_document *doc_) +{ + html_document *doc = (html_document*)doc_; + int count = ceilf(doc->box->h / doc->page_h); + return count; +} + +static void +htdoc_layout(fz_context *ctx, fz_document *doc_, float w, float h, float em) +{ + html_document *doc = (html_document*)doc_; + doc->page_w = w; + doc->page_h = h; + doc->em = em; + fz_layout_html(ctx, doc->box, w, h, em); +} + +static void +htdoc_drop_page_imp(fz_context *ctx, fz_page *page_) +{ +} + +static fz_rect * +htdoc_bound_page(fz_context *ctx, fz_page *page_, fz_rect *bbox) +{ + html_page *page = (html_page*)page_; + html_document *doc = page->doc; + bbox->x0 = bbox->y0 = 0; + bbox->x1 = doc->page_w; + bbox->y1 = doc->page_h; + return bbox; +} + +static void +htdoc_run_page(fz_context *ctx, fz_page *page_, fz_device *dev, const fz_matrix *ctm, fz_cookie *cookie) +{ + html_page *page = (html_page*)page_; + html_document *doc = page->doc; + int n = page->number; + fz_draw_html(ctx, doc->box, n * doc->page_h, (n+1) * doc->page_h, dev, ctm); +} + +static fz_page * +htdoc_load_page(fz_context *ctx, fz_document *doc_, int number) +{ + html_document *doc = (html_document*)doc_; + html_page *page = fz_new_page(ctx, sizeof *page); + page->super.bound_page = htdoc_bound_page; + page->super.run_page_contents = htdoc_run_page; + page->super.drop_page_imp = htdoc_drop_page_imp; + page->doc = doc; + page->number = number; + return (fz_page*)page; +} + +static html_document * +htdoc_open_document_with_stream(fz_context *ctx, fz_stream *file) +{ + html_document *doc; + fz_buffer *buf; + + doc = fz_malloc_struct(ctx, html_document); + doc->zip = fz_open_directory(ctx, "."); + doc->set = fz_new_html_font_set(ctx); + + doc->super.close = htdoc_close_document; + doc->super.layout = htdoc_layout; + doc->super.count_pages = htdoc_count_pages; + doc->super.load_page = htdoc_load_page; + + buf = fz_read_all(ctx, file, 0); + fz_write_buffer_byte(ctx, buf, 0); + doc->box = fz_parse_html(ctx, doc->set, doc->zip, ".", buf, NULL); + fz_drop_buffer(ctx, buf); + + htdoc_layout(ctx, (fz_document*)doc, DEFW, DEFH, DEFEM); + + return doc; +} + +static html_document * +htdoc_open_document(fz_context *ctx, const char *filename) +{ + char dirname[2048]; + fz_buffer *buf; + html_document *doc; + + fz_dirname(dirname, filename, sizeof dirname); + + doc = fz_malloc_struct(ctx, html_document); + doc->zip = fz_open_directory(ctx, dirname); + doc->set = fz_new_html_font_set(ctx); + + doc->super.close = htdoc_close_document; + doc->super.layout = htdoc_layout; + doc->super.count_pages = htdoc_count_pages; + doc->super.load_page = htdoc_load_page; + + buf = fz_read_file(ctx, filename); + fz_write_buffer_byte(ctx, buf, 0); + doc->box = fz_parse_html(ctx, doc->set, doc->zip, ".", buf, NULL); + fz_drop_buffer(ctx, buf); + + htdoc_layout(ctx, (fz_document*)doc, DEFW, DEFH, DEFEM); + + return doc; +} + +static int +htdoc_recognize(fz_context *doc, const char *magic) +{ + char *ext = strrchr(magic, '.'); + + if (ext) + { + if (!fz_strcasecmp(ext, ".xml") || !fz_strcasecmp(ext, ".xhtml") || !fz_strcasecmp(ext, ".html")) + return 100; + } + if (!strcmp(magic, "application/html+xml") || !strcmp(magic, "application/xml") || !strcmp(magic, "text/xml")) + return 100; + + return 0; +} + +fz_document_handler html_document_handler = +{ + (fz_document_recognize_fn *)&htdoc_recognize, + (fz_document_open_fn *)&htdoc_open_document, + (fz_document_open_with_stream_fn *)&htdoc_open_document_with_stream +}; |