From 85ee87997e3ee4eb579084f92d109b9b78dcf9c7 Mon Sep 17 00:00:00 2001
From: Tor Andersson
Date: Thu, 25 Aug 2016 12:44:13 +0200
Subject: Use U+FFFD instead of '?' for bad encodings in text extraction.

---
 source/pdf/pdf-unicode.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

(limited to 'source/pdf/pdf-unicode.c')

diff --git a/source/pdf/pdf-unicode.c b/source/pdf/pdf-unicode.c
index ca84341d..65bda460 100644
--- a/source/pdf/pdf-unicode.c
+++ b/source/pdf/pdf-unicode.c
@@ -96,7 +96,7 @@ pdf_load_to_unicode(fz_context *ctx, pdf_document *doc, pdf_font_desc *font,
 			if (strings[cpt])
 				font->cid_to_ucs[cpt] = pdf_lookup_agl(strings[cpt]);
 			else
-				font->cid_to_ucs[cpt] = '?';
+				font->cid_to_ucs[cpt] = 0xFFFD; /* replacement character */
 		}
 	}
 
-- 
cgit v1.2.3