summaryrefslogtreecommitdiff
path: root/source/pdf/pdf-crypt.c
diff options
context:
space:
mode:
authorTor Andersson <tor.andersson@artifex.com>2013-06-19 15:29:44 +0200
committerTor Andersson <tor.andersson@artifex.com>2013-06-20 16:45:35 +0200
commit0a927854a10e1e6b9770a81e2e1d9f3093631757 (patch)
tree3d65d820d9fdba2d0d394d99c36290c851b78ca0 /source/pdf/pdf-crypt.c
parent1ae8f19179c5f0f8c6352b3c7855465325d5449a (diff)
downloadmupdf-0a927854a10e1e6b9770a81e2e1d9f3093631757.tar.xz
Rearrange source files.
Diffstat (limited to 'source/pdf/pdf-crypt.c')
-rw-r--r--source/pdf/pdf-crypt.c1010
1 files changed, 1010 insertions, 0 deletions
diff --git a/source/pdf/pdf-crypt.c b/source/pdf/pdf-crypt.c
new file mode 100644
index 00000000..5128473c
--- /dev/null
+++ b/source/pdf/pdf-crypt.c
@@ -0,0 +1,1010 @@
+#include "mupdf/pdf.h"
+
+enum
+{
+ PDF_CRYPT_NONE,
+ PDF_CRYPT_RC4,
+ PDF_CRYPT_AESV2,
+ PDF_CRYPT_AESV3,
+ PDF_CRYPT_UNKNOWN,
+};
+
+typedef struct pdf_crypt_filter_s pdf_crypt_filter;
+
+struct pdf_crypt_filter_s
+{
+ int method;
+ int length;
+};
+
+struct pdf_crypt_s
+{
+ pdf_obj *id;
+
+ int v;
+ int length;
+ pdf_obj *cf;
+ pdf_crypt_filter stmf;
+ pdf_crypt_filter strf;
+
+ int r;
+ unsigned char o[48];
+ unsigned char u[48];
+ unsigned char oe[32];
+ unsigned char ue[32];
+ int p;
+ int encrypt_metadata;
+
+ unsigned char key[32]; /* decryption key generated from password */
+ fz_context *ctx;
+};
+
+static void pdf_parse_crypt_filter(fz_context *ctx, pdf_crypt_filter *cf, pdf_crypt *crypt, char *name);
+
+/*
+ * Create crypt object for decrypting strings and streams
+ * given the Encryption and ID objects.
+ */
+
+pdf_crypt *
+pdf_new_crypt(fz_context *ctx, pdf_obj *dict, pdf_obj *id)
+{
+ pdf_crypt *crypt;
+ pdf_obj *obj;
+
+ crypt = fz_malloc_struct(ctx, pdf_crypt);
+
+ /* Common to all security handlers (PDF 1.7 table 3.18) */
+
+ obj = pdf_dict_gets(dict, "Filter");
+ if (!pdf_is_name(obj))
+ {
+ pdf_free_crypt(ctx, crypt);
+ fz_throw(ctx, FZ_ERROR_GENERIC, "unspecified encryption handler");
+ }
+ if (strcmp(pdf_to_name(obj), "Standard") != 0)
+ {
+ pdf_free_crypt(ctx, crypt);
+ fz_throw(ctx, FZ_ERROR_GENERIC, "unknown encryption handler: '%s'", pdf_to_name(obj));
+ }
+
+ crypt->v = 0;
+ obj = pdf_dict_gets(dict, "V");
+ if (pdf_is_int(obj))
+ crypt->v = pdf_to_int(obj);
+ if (crypt->v != 1 && crypt->v != 2 && crypt->v != 4 && crypt->v != 5)
+ {
+ pdf_free_crypt(ctx, crypt);
+ fz_throw(ctx, FZ_ERROR_GENERIC, "unknown encryption version");
+ }
+
+ /* Standard security handler (PDF 1.7 table 3.19) */
+
+ obj = pdf_dict_gets(dict, "R");
+ if (pdf_is_int(obj))
+ crypt->r = pdf_to_int(obj);
+ else if (crypt->v <= 4)
+ {
+ fz_warn(ctx, "encryption dictionary missing revision value, guessing...");
+ if (crypt->v < 2)
+ crypt->r = 2;
+ else if (crypt->v == 2)
+ crypt->r = 3;
+ else if (crypt->v == 4)
+ crypt->r = 4;
+ }
+ else
+ {
+ pdf_free_crypt(ctx, crypt);
+ fz_throw(ctx, FZ_ERROR_GENERIC, "encryption dictionary missing version and revision value");
+ }
+
+ obj = pdf_dict_gets(dict, "O");
+ if (pdf_is_string(obj) && pdf_to_str_len(obj) == 32)
+ memcpy(crypt->o, pdf_to_str_buf(obj), 32);
+ /* /O and /U are supposed to be 48 bytes long for revision 5 and 6, they're often longer, though */
+ else if (crypt->r >= 5 && pdf_is_string(obj) && pdf_to_str_len(obj) >= 48)
+ memcpy(crypt->o, pdf_to_str_buf(obj), 48);
+ else
+ {
+ pdf_free_crypt(ctx, crypt);
+ fz_throw(ctx, FZ_ERROR_GENERIC, "encryption dictionary missing owner password");
+ }
+
+ obj = pdf_dict_gets(dict, "U");
+ if (pdf_is_string(obj) && pdf_to_str_len(obj) == 32)
+ memcpy(crypt->u, pdf_to_str_buf(obj), 32);
+ /* /O and /U are supposed to be 48 bytes long for revision 5 and 6, they're often longer, though */
+ else if (crypt->r >= 5 && pdf_is_string(obj) && pdf_to_str_len(obj) >= 48)
+ memcpy(crypt->u, pdf_to_str_buf(obj), 48);
+ else if (pdf_is_string(obj) && pdf_to_str_len(obj) < 32)
+ {
+ fz_warn(ctx, "encryption password key too short (%d)", pdf_to_str_len(obj));
+ memcpy(crypt->u, pdf_to_str_buf(obj), pdf_to_str_len(obj));
+ }
+ else
+ {
+ pdf_free_crypt(ctx, crypt);
+ fz_throw(ctx, FZ_ERROR_GENERIC, "encryption dictionary missing user password");
+ }
+
+ obj = pdf_dict_gets(dict, "P");
+ if (pdf_is_int(obj))
+ crypt->p = pdf_to_int(obj);
+ else
+ {
+ fz_warn(ctx, "encryption dictionary missing permissions");
+ crypt->p = 0xfffffffc;
+ }
+
+ if (crypt->r == 5 || crypt->r == 6)
+ {
+ obj = pdf_dict_gets(dict, "OE");
+ if (!pdf_is_string(obj) || pdf_to_str_len(obj) != 32)
+ {
+ pdf_free_crypt(ctx, crypt);
+ fz_throw(ctx, FZ_ERROR_GENERIC, "encryption dictionary missing owner encryption key");
+ }
+ memcpy(crypt->oe, pdf_to_str_buf(obj), 32);
+
+ obj = pdf_dict_gets(dict, "UE");
+ if (!pdf_is_string(obj) || pdf_to_str_len(obj) != 32)
+ {
+ pdf_free_crypt(ctx, crypt);
+ fz_throw(ctx, FZ_ERROR_GENERIC, "encryption dictionary missing user encryption key");
+ }
+ memcpy(crypt->ue, pdf_to_str_buf(obj), 32);
+ }
+
+ crypt->encrypt_metadata = 1;
+ obj = pdf_dict_gets(dict, "EncryptMetadata");
+ if (pdf_is_bool(obj))
+ crypt->encrypt_metadata = pdf_to_bool(obj);
+
+ /* Extract file identifier string */
+
+ if (pdf_is_array(id) && pdf_array_len(id) == 2)
+ {
+ obj = pdf_array_get(id, 0);
+ if (pdf_is_string(obj))
+ crypt->id = pdf_keep_obj(obj);
+ }
+ else
+ fz_warn(ctx, "missing file identifier, may not be able to do decryption");
+
+ /* Determine encryption key length */
+
+ crypt->length = 40;
+ if (crypt->v == 2 || crypt->v == 4)
+ {
+ obj = pdf_dict_gets(dict, "Length");
+ if (pdf_is_int(obj))
+ crypt->length = pdf_to_int(obj);
+
+ /* work-around for pdf generators that assume length is in bytes */
+ if (crypt->length < 40)
+ crypt->length = crypt->length * 8;
+
+ if (crypt->length % 8 != 0)
+ {
+ pdf_free_crypt(ctx, crypt);
+ fz_throw(ctx, FZ_ERROR_GENERIC, "invalid encryption key length");
+ }
+ if (crypt->length < 0 || crypt->length > 256)
+ {
+ pdf_free_crypt(ctx, crypt);
+ fz_throw(ctx, FZ_ERROR_GENERIC, "invalid encryption key length");
+ }
+ }
+
+ if (crypt->v == 5)
+ crypt->length = 256;
+
+ if (crypt->v == 1 || crypt->v == 2)
+ {
+ crypt->stmf.method = PDF_CRYPT_RC4;
+ crypt->stmf.length = crypt->length;
+
+ crypt->strf.method = PDF_CRYPT_RC4;
+ crypt->strf.length = crypt->length;
+ }
+
+ if (crypt->v == 4 || crypt->v == 5)
+ {
+ crypt->stmf.method = PDF_CRYPT_NONE;
+ crypt->stmf.length = crypt->length;
+
+ crypt->strf.method = PDF_CRYPT_NONE;
+ crypt->strf.length = crypt->length;
+
+ obj = pdf_dict_gets(dict, "CF");
+ if (pdf_is_dict(obj))
+ {
+ crypt->cf = pdf_keep_obj(obj);
+ }
+ else
+ {
+ crypt->cf = NULL;
+ }
+
+ fz_try(ctx)
+ {
+ obj = pdf_dict_gets(dict, "StmF");
+ if (pdf_is_name(obj))
+ pdf_parse_crypt_filter(ctx, &crypt->stmf, crypt, pdf_to_name(obj));
+
+ obj = pdf_dict_gets(dict, "StrF");
+ if (pdf_is_name(obj))
+ pdf_parse_crypt_filter(ctx, &crypt->strf, crypt, pdf_to_name(obj));
+ }
+ fz_catch(ctx)
+ {
+ pdf_free_crypt(ctx, crypt);
+ fz_rethrow_message(ctx, "cannot parse string crypt filter (%d %d R)", pdf_to_num(obj), pdf_to_gen(obj));
+ }
+
+ /* in crypt revision 4, the crypt filter determines the key length */
+ if (crypt->strf.method != PDF_CRYPT_NONE)
+ crypt->length = crypt->stmf.length;
+ }
+
+ return crypt;
+}
+
+void
+pdf_free_crypt(fz_context *ctx, pdf_crypt *crypt)
+{
+ pdf_drop_obj(crypt->id);
+ pdf_drop_obj(crypt->cf);
+ fz_free(ctx, crypt);
+}
+
+/*
+ * Parse a CF dictionary entry (PDF 1.7 table 3.22)
+ */
+
+static void
+pdf_parse_crypt_filter(fz_context *ctx, pdf_crypt_filter *cf, pdf_crypt *crypt, char *name)
+{
+ pdf_obj *obj;
+ pdf_obj *dict;
+ int is_identity = (strcmp(name, "Identity") == 0);
+ int is_stdcf = (!is_identity && (strcmp(name, "StdCF") == 0));
+
+ if (!is_identity && !is_stdcf)
+ fz_throw(ctx, FZ_ERROR_GENERIC, "Crypt Filter not Identity or StdCF (%d %d R)", pdf_to_num(crypt->cf), pdf_to_gen(crypt->cf));
+
+ cf->method = PDF_CRYPT_NONE;
+ cf->length = crypt->length;
+
+ if (!crypt->cf)
+ {
+ cf->method = (is_identity ? PDF_CRYPT_NONE : PDF_CRYPT_RC4);
+ return;
+ }
+
+ dict = pdf_dict_gets(crypt->cf, name);
+ if (!pdf_is_dict(dict))
+ fz_throw(ctx, FZ_ERROR_GENERIC, "cannot parse crypt filter (%d %d R)", pdf_to_num(crypt->cf), pdf_to_gen(crypt->cf));
+
+ obj = pdf_dict_gets(dict, "CFM");
+ if (pdf_is_name(obj))
+ {
+ if (!strcmp(pdf_to_name(obj), "None"))
+ cf->method = PDF_CRYPT_NONE;
+ else if (!strcmp(pdf_to_name(obj), "V2"))
+ cf->method = PDF_CRYPT_RC4;
+ else if (!strcmp(pdf_to_name(obj), "AESV2"))
+ cf->method = PDF_CRYPT_AESV2;
+ else if (!strcmp(pdf_to_name(obj), "AESV3"))
+ cf->method = PDF_CRYPT_AESV3;
+ else
+ fz_warn(ctx, "unknown encryption method: %s", pdf_to_name(obj));
+ }
+
+ obj = pdf_dict_gets(dict, "Length");
+ if (pdf_is_int(obj))
+ cf->length = pdf_to_int(obj);
+
+ /* the length for crypt filters is supposed to be in bytes not bits */
+ if (cf->length < 40)
+ cf->length = cf->length * 8;
+
+ if ((cf->length % 8) != 0)
+ fz_throw(ctx, FZ_ERROR_GENERIC, "invalid key length: %d", cf->length);
+
+ if ((crypt->r == 1 || crypt->r == 2 || crypt->r == 4) &&
+ (cf->length < 0 || cf->length > 128))
+ fz_throw(ctx, FZ_ERROR_GENERIC, "invalid key length: %d", cf->length);
+ if ((crypt->r == 5 || crypt->r == 6) && cf->length != 256)
+ fz_throw(ctx, FZ_ERROR_GENERIC, "invalid key length: %d", cf->length);
+}
+
+/*
+ * Compute an encryption key (PDF 1.7 algorithm 3.2)
+ */
+
+static const unsigned char padding[32] =
+{
+ 0x28, 0xbf, 0x4e, 0x5e, 0x4e, 0x75, 0x8a, 0x41,
+ 0x64, 0x00, 0x4e, 0x56, 0xff, 0xfa, 0x01, 0x08,
+ 0x2e, 0x2e, 0x00, 0xb6, 0xd0, 0x68, 0x3e, 0x80,
+ 0x2f, 0x0c, 0xa9, 0xfe, 0x64, 0x53, 0x69, 0x7a
+};
+
+static void
+pdf_compute_encryption_key(pdf_crypt *crypt, unsigned char *password, int pwlen, unsigned char *key)
+{
+ unsigned char buf[32];
+ unsigned int p;
+ int i, n;
+ fz_md5 md5;
+
+ n = crypt->length / 8;
+
+ /* Step 1 - copy and pad password string */
+ if (pwlen > 32)
+ pwlen = 32;
+ memcpy(buf, password, pwlen);
+ memcpy(buf + pwlen, padding, 32 - pwlen);
+
+ /* Step 2 - init md5 and pass value of step 1 */
+ fz_md5_init(&md5);
+ fz_md5_update(&md5, buf, 32);
+
+ /* Step 3 - pass O value */
+ fz_md5_update(&md5, crypt->o, 32);
+
+ /* Step 4 - pass P value as unsigned int, low-order byte first */
+ p = (unsigned int) crypt->p;
+ buf[0] = (p) & 0xFF;
+ buf[1] = (p >> 8) & 0xFF;
+ buf[2] = (p >> 16) & 0xFF;
+ buf[3] = (p >> 24) & 0xFF;
+ fz_md5_update(&md5, buf, 4);
+
+ /* Step 5 - pass first element of ID array */
+ fz_md5_update(&md5, (unsigned char *)pdf_to_str_buf(crypt->id), pdf_to_str_len(crypt->id));
+
+ /* Step 6 (revision 4 or greater) - if metadata is not encrypted pass 0xFFFFFFFF */
+ if (crypt->r >= 4)
+ {
+ if (!crypt->encrypt_metadata)
+ {
+ buf[0] = 0xFF;
+ buf[1] = 0xFF;
+ buf[2] = 0xFF;
+ buf[3] = 0xFF;
+ fz_md5_update(&md5, buf, 4);
+ }
+ }
+
+ /* Step 7 - finish the hash */
+ fz_md5_final(&md5, buf);
+
+ /* Step 8 (revision 3 or greater) - do some voodoo 50 times */
+ if (crypt->r >= 3)
+ {
+ for (i = 0; i < 50; i++)
+ {
+ fz_md5_init(&md5);
+ fz_md5_update(&md5, buf, n);
+ fz_md5_final(&md5, buf);
+ }
+ }
+
+ /* Step 9 - the key is the first 'n' bytes of the result */
+ memcpy(key, buf, n);
+}
+
+/*
+ * Compute an encryption key (PDF 1.7 ExtensionLevel 3 algorithm 3.2a)
+ */
+
+static void
+pdf_compute_encryption_key_r5(fz_context *ctx, pdf_crypt *crypt, unsigned char *password, int pwlen, int ownerkey, unsigned char *validationkey)
+{
+ unsigned char buffer[128 + 8 + 48];
+ fz_sha256 sha256;
+ fz_aes aes;
+
+ /* Step 2 - truncate UTF-8 password to 127 characters */
+
+ if (pwlen > 127)
+ pwlen = 127;
+
+ /* Step 3/4 - test password against owner/user key and compute encryption key */
+
+ memcpy(buffer, password, pwlen);
+ if (ownerkey)
+ {
+ memcpy(buffer + pwlen, crypt->o + 32, 8);
+ memcpy(buffer + pwlen + 8, crypt->u, 48);
+ }
+ else
+ memcpy(buffer + pwlen, crypt->u + 32, 8);
+
+ fz_sha256_init(&sha256);
+ fz_sha256_update(&sha256, buffer, pwlen + 8 + (ownerkey ? 48 : 0));
+ fz_sha256_final(&sha256, validationkey);
+
+ /* Step 3.5/4.5 - compute file encryption key from OE/UE */
+
+ memcpy(buffer + pwlen, crypt->u + 40, 8);
+
+ fz_sha256_init(&sha256);
+ fz_sha256_update(&sha256, buffer, pwlen + 8);
+ fz_sha256_final(&sha256, buffer);
+
+ /* clear password buffer and use it as iv */
+ memset(buffer + 32, 0, sizeof(buffer) - 32);
+ if (aes_setkey_dec(&aes, buffer, crypt->length))
+ fz_throw(ctx, FZ_ERROR_GENERIC, "AES key init failed (keylen=%d)", crypt->length);
+ aes_crypt_cbc(&aes, AES_DECRYPT, 32, buffer + 32, ownerkey ? crypt->oe : crypt->ue, crypt->key);
+}
+
+/*
+ * Compute an encryption key (PDF 1.7 ExtensionLevel 8 algorithm)
+ *
+ * Adobe has not yet released the details, so the algorithm reference is:
+ * http://esec-lab.sogeti.com/post/The-undocumented-password-validation-algorithm-of-Adobe-Reader-X
+ */
+
+static void
+pdf_compute_hardened_hash_r6(fz_context *ctx, unsigned char *password, int pwlen, unsigned char salt[16], unsigned char *ownerkey, unsigned char hash[32])
+{
+ unsigned char data[(128 + 64 + 48) * 64];
+ unsigned char block[64];
+ int block_size = 32;
+ int data_len = 0;
+ int i, j, sum;
+
+ fz_sha256 sha256;
+ fz_sha384 sha384;
+ fz_sha512 sha512;
+ fz_aes aes;
+
+ /* Step 1: calculate initial data block */
+ fz_sha256_init(&sha256);
+ fz_sha256_update(&sha256, password, pwlen);
+ fz_sha256_update(&sha256, salt, 8);
+ if (ownerkey)
+ fz_sha256_update(&sha256, ownerkey, 48);
+ fz_sha256_final(&sha256, block);
+
+ for (i = 0; i < 64 || i < data[data_len * 64 - 1] + 32; i++)
+ {
+ /* Step 2: repeat password and data block 64 times */
+ memcpy(data, password, pwlen);
+ memcpy(data + pwlen, block, block_size);
+ memcpy(data + pwlen + block_size, ownerkey, ownerkey ? 48 : 0);
+ data_len = pwlen + block_size + (ownerkey ? 48 : 0);
+ for (j = 1; j < 64; j++)
+ memcpy(data + j * data_len, data, data_len);
+
+ /* Step 3: encrypt data using data block as key and iv */
+ if (aes_setkey_enc(&aes, block, 128))
+ fz_throw(ctx, FZ_ERROR_GENERIC, "AES key init failed (keylen=%d)", 128);
+ aes_crypt_cbc(&aes, AES_ENCRYPT, data_len * 64, block + 16, data, data);
+
+ /* Step 4: determine SHA-2 hash size for this round */
+ for (j = 0, sum = 0; j < 16; j++)
+ sum += data[j];
+
+ /* Step 5: calculate data block for next round */
+ block_size = 32 + (sum % 3) * 16;
+ switch (block_size)
+ {
+ case 32:
+ fz_sha256_init(&sha256);
+ fz_sha256_update(&sha256, data, data_len * 64);
+ fz_sha256_final(&sha256, block);
+ break;
+ case 48:
+ fz_sha384_init(&sha384);
+ fz_sha384_update(&sha384, data, data_len * 64);
+ fz_sha384_final(&sha384, block);
+ break;
+ case 64:
+ fz_sha512_init(&sha512);
+ fz_sha512_update(&sha512, data, data_len * 64);
+ fz_sha512_final(&sha512, block);
+ break;
+ }
+ }
+
+ memset(data, 0, sizeof(data));
+ memcpy(hash, block, 32);
+}
+
+static void
+pdf_compute_encryption_key_r6(fz_context *ctx, pdf_crypt *crypt, unsigned char *password, int pwlen, int ownerkey, unsigned char *validationkey)
+{
+ unsigned char hash[32];
+ unsigned char iv[16];
+ fz_aes aes;
+
+ if (pwlen > 127)
+ pwlen = 127;
+
+ pdf_compute_hardened_hash_r6(ctx, password, pwlen,
+ (ownerkey ? crypt->o : crypt->u) + 32,
+ ownerkey ? crypt->u : NULL, validationkey);
+ pdf_compute_hardened_hash_r6(ctx, password, pwlen,
+ crypt->u + 40, NULL, hash);
+
+ memset(iv, 0, sizeof(iv));
+ if (aes_setkey_dec(&aes, hash, 256))
+ fz_throw(ctx, FZ_ERROR_GENERIC, "AES key init failed (keylen=256)");
+ aes_crypt_cbc(&aes, AES_DECRYPT, 32, iv,
+ ownerkey ? crypt->oe : crypt->ue, crypt->key);
+}
+
+/*
+ * Computing the user password (PDF 1.7 algorithm 3.4 and 3.5)
+ * Also save the generated key for decrypting objects and streams in crypt->key.
+ */
+
+static void
+pdf_compute_user_password(fz_context *ctx, pdf_crypt *crypt, unsigned char *password, int pwlen, unsigned char *output)
+{
+ if (crypt->r == 2)
+ {
+ fz_arc4 arc4;
+
+ pdf_compute_encryption_key(crypt, password, pwlen, crypt->key);
+ fz_arc4_init(&arc4, crypt->key, crypt->length / 8);
+ fz_arc4_encrypt(&arc4, output, padding, 32);
+ }
+
+ if (crypt->r == 3 || crypt->r == 4)
+ {
+ unsigned char xor[32];
+ unsigned char digest[16];
+ fz_md5 md5;
+ fz_arc4 arc4;
+ int i, x, n;
+
+ n = crypt->length / 8;
+
+ pdf_compute_encryption_key(crypt, password, pwlen, crypt->key);
+
+ fz_md5_init(&md5);
+ fz_md5_update(&md5, padding, 32);
+ fz_md5_update(&md5, (unsigned char*)pdf_to_str_buf(crypt->id), pdf_to_str_len(crypt->id));
+ fz_md5_final(&md5, digest);
+
+ fz_arc4_init(&arc4, crypt->key, n);
+ fz_arc4_encrypt(&arc4, output, digest, 16);
+
+ for (x = 1; x <= 19; x++)
+ {
+ for (i = 0; i < n; i++)
+ xor[i] = crypt->key[i] ^ x;
+ fz_arc4_init(&arc4, xor, n);
+ fz_arc4_encrypt(&arc4, output, output, 16);
+ }
+
+ memcpy(output + 16, padding, 16);
+ }
+
+ if (crypt->r == 5)
+ {
+ pdf_compute_encryption_key_r5(ctx, crypt, password, pwlen, 0, output);
+ }
+
+ if (crypt->r == 6)
+ {
+ pdf_compute_encryption_key_r6(ctx, crypt, password, pwlen, 0, output);
+ }
+}
+
+/*
+ * Authenticating the user password (PDF 1.7 algorithm 3.6
+ * and ExtensionLevel 3 algorithm 3.11)
+ * This also has the side effect of saving a key generated
+ * from the password for decrypting objects and streams.
+ */
+
+static int
+pdf_authenticate_user_password(fz_context *ctx, pdf_crypt *crypt, unsigned char *password, int pwlen)
+{
+ unsigned char output[32];
+ pdf_compute_user_password(ctx, crypt, password, pwlen, output);
+ if (crypt->r == 2 || crypt->r == 5 || crypt->r == 6)
+ return memcmp(output, crypt->u, 32) == 0;
+ if (crypt->r == 3 || crypt->r == 4)
+ return memcmp(output, crypt->u, 16) == 0;
+ return 0;
+}
+
+/*
+ * Authenticating the owner password (PDF 1.7 algorithm 3.7
+ * and ExtensionLevel 3 algorithm 3.12)
+ * Generates the user password from the owner password
+ * and calls pdf_authenticate_user_password.
+ */
+
+static int
+pdf_authenticate_owner_password(fz_context *ctx, pdf_crypt *crypt, unsigned char *ownerpass, int pwlen)
+{
+ unsigned char pwbuf[32];
+ unsigned char key[32];
+ unsigned char xor[32];
+ unsigned char userpass[32];
+ int i, n, x;
+ fz_md5 md5;
+ fz_arc4 arc4;
+
+ if (crypt->r == 5)
+ {
+ /* PDF 1.7 ExtensionLevel 3 algorithm 3.12 */
+ pdf_compute_encryption_key_r5(ctx, crypt, ownerpass, pwlen, 1, key);
+ return !memcmp(key, crypt->o, 32);
+ }
+ else if (crypt->r == 6)
+ {
+ /* PDF 1.7 ExtensionLevel 8 algorithm */
+ pdf_compute_encryption_key_r6(ctx, crypt, ownerpass, pwlen, 1, key);
+ return !memcmp(key, crypt->o, 32);
+ }
+
+ n = crypt->length / 8;
+
+ /* Step 1 -- steps 1 to 4 of PDF 1.7 algorithm 3.3 */
+
+ /* copy and pad password string */
+ if (pwlen > 32)
+ pwlen = 32;
+ memcpy(pwbuf, ownerpass, pwlen);
+ memcpy(pwbuf + pwlen, padding, 32 - pwlen);
+
+ /* take md5 hash of padded password */
+ fz_md5_init(&md5);
+ fz_md5_update(&md5, pwbuf, 32);
+ fz_md5_final(&md5, key);
+
+ /* do some voodoo 50 times (Revision 3 or greater) */
+ if (crypt->r >= 3)
+ {
+ for (i = 0; i < 50; i++)
+ {
+ fz_md5_init(&md5);
+ fz_md5_update(&md5, key, 16);
+ fz_md5_final(&md5, key);
+ }
+ }
+
+ /* Step 2 (Revision 2) */
+ if (crypt->r == 2)
+ {
+ fz_arc4_init(&arc4, key, n);
+ fz_arc4_encrypt(&arc4, userpass, crypt->o, 32);
+ }
+
+ /* Step 2 (Revision 3 or greater) */
+ if (crypt->r >= 3)
+ {
+ memcpy(userpass, crypt->o, 32);
+ for (x = 0; x < 20; x++)
+ {
+ for (i = 0; i < n; i++)
+ xor[i] = key[i] ^ (19 - x);
+ fz_arc4_init(&arc4, xor, n);
+ fz_arc4_encrypt(&arc4, userpass, userpass, 32);
+ }
+ }
+
+ return pdf_authenticate_user_password(ctx, crypt, userpass, 32);
+}
+
+static void pdf_docenc_from_utf8(char *password, const char *utf8, int n)
+{
+ int i = 0, k, c;
+ while (*utf8 && i + 1 < n)
+ {
+ utf8 += fz_chartorune(&c, utf8);
+ for (k = 0; k < 256; k++)
+ {
+ if (c == pdf_doc_encoding[k])
+ {
+ password[i++] = k;
+ break;
+ }
+ }
+ /* FIXME: drop characters that can't be encoded or return an error? */
+ }
+ password[i] = 0;
+}
+
+static void pdf_saslprep_from_utf8(char *password, const char *utf8, int n)
+{
+ /* TODO: stringprep with SALSprep profile */
+ fz_strlcpy(password, utf8, n);
+}
+
+int
+pdf_authenticate_password(pdf_document *xref, const char *pwd_utf8)
+{
+ char password[2048];
+
+ if (xref->crypt)
+ {
+ password[0] = 0;
+ if (pwd_utf8)
+ {
+ if (xref->crypt->r <= 4)
+ pdf_docenc_from_utf8(password, pwd_utf8, sizeof password);
+ else
+ pdf_saslprep_from_utf8(password, pwd_utf8, sizeof password);
+ }
+
+ if (pdf_authenticate_user_password(xref->ctx, xref->crypt, (unsigned char *)password, strlen(password)))
+ return 1;
+ if (pdf_authenticate_owner_password(xref->ctx, xref->crypt, (unsigned char *)password, strlen(password)))
+ return 1;
+ return 0;
+ }
+ return 1;
+}
+
+int
+pdf_needs_password(pdf_document *xref)
+{
+ if (!xref->crypt)
+ return 0;
+ if (pdf_authenticate_password(xref, ""))
+ return 0;
+ return 1;
+}
+
+int
+pdf_has_permission(pdf_document *xref, int p)
+{
+ if (!xref->crypt)
+ return 1;
+ return xref->crypt->p & p;
+}
+
+unsigned char *
+pdf_crypt_key(pdf_document *xref)
+{
+ if (xref->crypt)
+ return xref->crypt->key;
+ return NULL;
+}
+
+int
+pdf_crypt_version(pdf_document *xref)
+{
+ if (xref->crypt)
+ return xref->crypt->v;
+ return 0;
+}
+
+int pdf_crypt_revision(pdf_document *xref)
+{
+ if (xref->crypt)
+ return xref->crypt->r;
+ return 0;
+}
+
+char *
+pdf_crypt_method(pdf_document *xref)
+{
+ if (xref->crypt)
+ {
+ switch (xref->crypt->strf.method)
+ {
+ case PDF_CRYPT_NONE: return "None";
+ case PDF_CRYPT_RC4: return "RC4";
+ case PDF_CRYPT_AESV2: return "AES";
+ case PDF_CRYPT_AESV3: return "AES";
+ case PDF_CRYPT_UNKNOWN: return "Unknown";
+ }
+ }
+ return "None";
+}
+
+int
+pdf_crypt_length(pdf_document *xref)
+{
+ if (xref->crypt)
+ return xref->crypt->length;
+ return 0;
+}
+
+/*
+ * PDF 1.7 algorithm 3.1 and ExtensionLevel 3 algorithm 3.1a
+ *
+ * Using the global encryption key that was generated from the
+ * password, create a new key that is used to decrypt individual
+ * objects and streams. This key is based on the object and
+ * generation numbers.
+ */
+
+static int
+pdf_compute_object_key(pdf_crypt *crypt, pdf_crypt_filter *cf, int num, int gen, unsigned char *key, int max_len)
+{
+ fz_md5 md5;
+ unsigned char message[5];
+ int key_len = crypt->length / 8;
+
+ if (key_len > max_len)
+ key_len = max_len;
+
+ if (cf->method == PDF_CRYPT_AESV3)
+ {
+ memcpy(key, crypt->key, key_len);
+ return key_len;
+ }
+
+ fz_md5_init(&md5);
+ fz_md5_update(&md5, crypt->key, key_len);
+ message[0] = (num) & 0xFF;
+ message[1] = (num >> 8) & 0xFF;
+ message[2] = (num >> 16) & 0xFF;
+ message[3] = (gen) & 0xFF;
+ message[4] = (gen >> 8) & 0xFF;
+ fz_md5_update(&md5, message, 5);
+
+ if (cf->method == PDF_CRYPT_AESV2)
+ fz_md5_update(&md5, (unsigned char *)"sAlT", 4);
+
+ fz_md5_final(&md5, key);
+
+ if (key_len + 5 > 16)
+ return 16;
+ return key_len + 5;
+}
+
+/*
+ * PDF 1.7 algorithm 3.1 and ExtensionLevel 3 algorithm 3.1a
+ *
+ * Decrypt all strings in obj modifying the data in-place.
+ * Recurse through arrays and dictionaries, but do not follow
+ * indirect references.
+ */
+
+static void
+pdf_crypt_obj_imp(fz_context *ctx, pdf_crypt *crypt, pdf_obj *obj, unsigned char *key, int keylen)
+{
+ unsigned char *s;
+ int i, n;
+
+ if (pdf_is_indirect(obj))
+ return;
+
+ if (pdf_is_string(obj))
+ {
+ s = (unsigned char *)pdf_to_str_buf(obj);
+ n = pdf_to_str_len(obj);
+
+ if (crypt->strf.method == PDF_CRYPT_RC4)
+ {
+ fz_arc4 arc4;
+ fz_arc4_init(&arc4, key, keylen);
+ fz_arc4_encrypt(&arc4, s, s, n);
+ }
+
+ if (crypt->strf.method == PDF_CRYPT_AESV2 || crypt->strf.method == PDF_CRYPT_AESV3)
+ {
+ if (n == 0)
+ {
+ /* Empty strings are permissible */
+ }
+ else if (n & 15 || n < 32)
+ fz_warn(ctx, "invalid string length for aes encryption");
+ else
+ {
+ unsigned char iv[16];
+ fz_aes aes;
+ memcpy(iv, s, 16);
+ if (aes_setkey_dec(&aes, key, keylen * 8))
+ fz_throw(ctx, FZ_ERROR_GENERIC, "AES key init failed (keylen=%d)", keylen * 8);
+ aes_crypt_cbc(&aes, AES_DECRYPT, n - 16, iv, s + 16, s);
+ /* delete space used for iv and padding bytes at end */
+ if (s[n - 17] < 1 || s[n - 17] > 16)
+ fz_warn(ctx, "aes padding out of range");
+ else
+ pdf_set_str_len(obj, n - 16 - s[n - 17]);
+ }
+ }
+ }
+
+ else if (pdf_is_array(obj))
+ {
+ n = pdf_array_len(obj);
+ for (i = 0; i < n; i++)
+ {
+ pdf_crypt_obj_imp(ctx, crypt, pdf_array_get(obj, i), key, keylen);
+ }
+ }
+
+ else if (pdf_is_dict(obj))
+ {
+ n = pdf_dict_len(obj);
+ for (i = 0; i < n; i++)
+ {
+ pdf_crypt_obj_imp(ctx, crypt, pdf_dict_get_val(obj, i), key, keylen);
+ }
+ }
+}
+
+void
+pdf_crypt_obj(fz_context *ctx, pdf_crypt *crypt, pdf_obj *obj, int num, int gen)
+{
+ unsigned char key[32];
+ int len;
+
+ len = pdf_compute_object_key(crypt, &crypt->strf, num, gen, key, 32);
+
+ pdf_crypt_obj_imp(ctx, crypt, obj, key, len);
+}
+
+/*
+ * PDF 1.7 algorithm 3.1 and ExtensionLevel 3 algorithm 3.1a
+ *
+ * Create filter suitable for de/encrypting a stream.
+ */
+static fz_stream *
+pdf_open_crypt_imp(fz_stream *chain, pdf_crypt *crypt, pdf_crypt_filter *stmf, int num, int gen)
+{
+ unsigned char key[32];
+ int len;
+
+ crypt->ctx = chain->ctx;
+ len = pdf_compute_object_key(crypt, stmf, num, gen, key, 32);
+
+ if (stmf->method == PDF_CRYPT_RC4)
+ return fz_open_arc4(chain, key, len);
+
+ if (stmf->method == PDF_CRYPT_AESV2 || stmf->method == PDF_CRYPT_AESV3)
+ return fz_open_aesd(chain, key, len);
+
+ return fz_open_copy(chain);
+}
+
+fz_stream *
+pdf_open_crypt(fz_stream *chain, pdf_crypt *crypt, int num, int gen)
+{
+ return pdf_open_crypt_imp(chain, crypt, &crypt->stmf, num, gen);
+}
+
+fz_stream *
+pdf_open_crypt_with_filter(fz_stream *chain, pdf_crypt *crypt, char *name, int num, int gen)
+{
+ if (strcmp(name, "Identity"))
+ {
+ pdf_crypt_filter cf;
+ pdf_parse_crypt_filter(chain->ctx, &cf, crypt, name);
+ return pdf_open_crypt_imp(chain, crypt, &cf, num, gen);
+ }
+ return chain;
+}
+
+#ifndef NDEBUG
+void pdf_print_crypt(pdf_crypt *crypt)
+{
+ int i;
+
+ printf("crypt {\n");
+
+ printf("\tv=%d length=%d\n", crypt->v, crypt->length);
+ printf("\tstmf method=%d length=%d\n", crypt->stmf.method, crypt->stmf.length);
+ printf("\tstrf method=%d length=%d\n", crypt->strf.method, crypt->strf.length);
+ printf("\tr=%d\n", crypt->r);
+
+ printf("\to=<");
+ for (i = 0; i < 32; i++)
+ printf("%02X", crypt->o[i]);
+ printf(">\n");
+
+ printf("\tu=<");
+ for (i = 0; i < 32; i++)
+ printf("%02X", crypt->u[i]);
+ printf(">\n");
+
+ printf("}\n");
+}
+#endif