#include "mupdf/html.h"
#define DEFW (450)
#define DEFH (600)
#define DEFEM (12)
typedef struct html_document_s html_document;
typedef struct html_page_s html_page;
struct html_document_s
{
fz_document super;
fz_archive *zip;
fz_html_font_set *set;
float page_w, page_h, em;
fz_html *box;
};
struct html_page_s
{
fz_page super;
html_document *doc;
int number;
};
static void
htdoc_close_document(fz_context *ctx, fz_document *doc_)
{
html_document *doc = (html_document*)doc_;
fz_drop_archive(ctx, doc->zip);
fz_drop_html(ctx, doc->box);
fz_drop_html_font_set(ctx, doc->set);
fz_free(ctx, doc);
}
static int
htdoc_count_pages(fz_context *ctx, fz_document *doc_)
{
html_document *doc = (html_document*)doc_;
int count = ceilf(doc->box->h / doc->page_h);
return count;
}
static void
htdoc_layout(fz_context *ctx, fz_document *doc_, float w, float h, float em)
{
html_document *doc = (html_document*)doc_;
doc->page_w = w;
doc->page_h = h;
doc->em = em;
fz_layout_html(ctx, doc->box, w, h, em);
}
static void
htdoc_drop_page_imp(fz_context *ctx, fz_page *page_)
{
}
static fz_rect *
htdoc_bound_page(fz_context *ctx, fz_page *page_, fz_rect *bbox)
{
html_page *page = (html_page*)page_;
html_document *doc = page->doc;
bbox->x0 = bbox->y0 = 0;
bbox->x1 = doc->page_w;
bbox->y1 = doc->page_h;
return bbox;
}
static void
htdoc_run_page(fz_context *ctx, fz_page *page_, fz_device *dev, const fz_matrix *ctm, fz_cookie *cookie)
{
html_page *page = (html_page*)page_;
html_document *doc = page->doc;
int n = page->number;
fz_draw_html(ctx, doc->box, n * doc->page_h, (n+1) * doc->page_h, dev, ctm);
}
static fz_page *
htdoc_load_page(fz_context *ctx, fz_document *doc_, int number)
{
html_document *doc = (html_document*)doc_;
html_page *page = fz_new_page(ctx, sizeof *page);
page->super.bound_page = htdoc_bound_page;
page->super.run_page_contents = htdoc_run_page;
page->super.drop_page_imp = htdoc_drop_page_imp;
page->doc = doc;
page->number = number;
return (fz_page*)page;
}
static fz_document *
htdoc_open_document_with_stream(fz_context *ctx, fz_stream *file)
{
html_document *doc;
fz_buffer *buf;
doc = fz_malloc_struct(ctx, html_document);
doc->super.close = htdoc_close_document;
doc->super.layout = htdoc_layout;
doc->super.count_pages = htdoc_count_pages;
doc->super.load_page = htdoc_load_page;
doc->zip = fz_open_directory(ctx, ".");
doc->set = fz_new_html_font_set(ctx);
buf = fz_read_all(ctx, file, 0);
fz_write_buffer_byte(ctx, buf, 0);
doc->box = fz_parse_html(ctx, doc->set, doc->zip, ".", buf, NULL);
fz_drop_buffer(ctx, buf);
htdoc_layout(ctx, (fz_document*)doc, DEFW, DEFH, DEFEM);
return (fz_document*)doc;
}
static fz_document *
htdoc_open_document(fz_context *ctx, const char *filename)
{
char dirname[2048];
fz_buffer *buf;
html_document *doc;
fz_dirname(dirname, filename, sizeof dirname);
doc = fz_malloc_struct(ctx, html_document);
doc->super.close = htdoc_close_document;
doc->super.layout = htdoc_layout;
doc->super.count_pages = htdoc_count_pages;
doc->super.load_page = htdoc_load_page;
doc->zip = fz_open_directory(ctx, dirname);
doc->set = fz_new_html_font_set(ctx);
buf = fz_read_file(ctx, filename);
fz_write_buffer_byte(ctx, buf, 0);
doc->box = fz_parse_html(ctx, doc->set, doc->zip, ".", buf, NULL);
fz_drop_buffer(ctx, buf);
htdoc_layout(ctx, (fz_document*)doc, DEFW, DEFH, DEFEM);
return (fz_document*)doc;
}
static int
htdoc_recognize(fz_context *doc, const char *magic)
{
char *ext = strrchr(magic, '.');
if (ext)
{
if (!fz_strcasecmp(ext, ".xml") || !fz_strcasecmp(ext, ".xhtml") || !fz_strcasecmp(ext, ".html"))
return 100;
}
if (!strcmp(magic, "application/html+xml") || !strcmp(magic, "application/xml") || !strcmp(magic, "text/xml"))
return 100;
return 0;
}
fz_document_handler html_document_handler =
{
&htdoc_recognize,
&htdoc_open_document,
&htdoc_open_document_with_stream
};