diff options
Diffstat (limited to 'fpdfsdk/fpdf_flatten.cpp')
-rw-r--r-- | fpdfsdk/fpdf_flatten.cpp | 518 |
1 files changed, 518 insertions, 0 deletions
diff --git a/fpdfsdk/fpdf_flatten.cpp b/fpdfsdk/fpdf_flatten.cpp new file mode 100644 index 0000000000..cca63d6b76 --- /dev/null +++ b/fpdfsdk/fpdf_flatten.cpp @@ -0,0 +1,518 @@ +// Copyright 2014 PDFium Authors. All rights reserved. +// Use of this source code is governed by a BSD-style license that can be +// found in the LICENSE file. + +// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com + +#include "public/fpdf_flatten.h" + +#include <algorithm> + +#include "core/include/fpdfapi/cpdf_array.h" +#include "core/include/fpdfapi/cpdf_document.h" +#include "core/include/fpdfapi/cpdf_number.h" +#include "fpdfsdk/include/fsdk_define.h" + +typedef CFX_ArrayTemplate<CPDF_Dictionary*> CPDF_ObjectArray; +typedef CFX_ArrayTemplate<CFX_FloatRect> CPDF_RectArray; + +enum FPDF_TYPE { MAX, MIN }; +enum FPDF_VALUE { TOP, LEFT, RIGHT, BOTTOM }; + +FX_BOOL IsValiableRect(CFX_FloatRect rect, CFX_FloatRect rcPage) { + if (rect.left - rect.right > 0.000001f || rect.bottom - rect.top > 0.000001f) + return FALSE; + + if (rect.left == 0.0f && rect.top == 0.0f && rect.right == 0.0f && + rect.bottom == 0.0f) + return FALSE; + + if (!rcPage.IsEmpty()) { + if (rect.left - rcPage.left < -10.000001f || + rect.right - rcPage.right > 10.000001f || + rect.top - rcPage.top > 10.000001f || + rect.bottom - rcPage.bottom < -10.000001f) + return FALSE; + } + + return TRUE; +} + +void GetContentsRect(CPDF_Document* pDoc, + CPDF_Dictionary* pDict, + CPDF_RectArray* pRectArray) { + std::unique_ptr<CPDF_Page> pPDFPage(new CPDF_Page); + pPDFPage->Load(pDoc, pDict, FALSE); + pPDFPage->ParseContent(nullptr); + + for (auto& pPageObject : *pPDFPage->GetPageObjectList()) { + if (!pPageObject) + continue; + + CFX_FloatRect rc; + rc.left = pPageObject->m_Left; + rc.right = pPageObject->m_Right; + rc.bottom = pPageObject->m_Bottom; + rc.top = pPageObject->m_Top; + if (IsValiableRect(rc, pDict->GetRectBy("MediaBox"))) + pRectArray->Add(rc); + } +} + +void ParserStream(CPDF_Dictionary* pPageDic, + CPDF_Dictionary* pStream, + CPDF_RectArray* pRectArray, + CPDF_ObjectArray* pObjectArray) { + if (!pStream) + return; + CFX_FloatRect rect; + if (pStream->KeyExist("Rect")) + rect = pStream->GetRectBy("Rect"); + else if (pStream->KeyExist("BBox")) + rect = pStream->GetRectBy("BBox"); + + if (IsValiableRect(rect, pPageDic->GetRectBy("MediaBox"))) + pRectArray->Add(rect); + + pObjectArray->Add(pStream); +} + +int ParserAnnots(CPDF_Document* pSourceDoc, + CPDF_Dictionary* pPageDic, + CPDF_RectArray* pRectArray, + CPDF_ObjectArray* pObjectArray, + int nUsage) { + if (!pSourceDoc || !pPageDic) + return FLATTEN_FAIL; + + GetContentsRect(pSourceDoc, pPageDic, pRectArray); + CPDF_Array* pAnnots = pPageDic->GetArrayBy("Annots"); + if (!pAnnots) + return FLATTEN_NOTHINGTODO; + + FX_DWORD dwSize = pAnnots->GetCount(); + for (int i = 0; i < (int)dwSize; i++) { + CPDF_Dictionary* pAnnotDic = ToDictionary(pAnnots->GetElementValue(i)); + if (!pAnnotDic) + continue; + + CFX_ByteString sSubtype = pAnnotDic->GetStringBy("Subtype"); + if (sSubtype == "Popup") + continue; + + int nAnnotFlag = pAnnotDic->GetIntegerBy("F"); + if (nAnnotFlag & ANNOTFLAG_HIDDEN) + continue; + + if (nUsage == FLAT_NORMALDISPLAY) { + if (nAnnotFlag & ANNOTFLAG_INVISIBLE) + continue; + + ParserStream(pPageDic, pAnnotDic, pRectArray, pObjectArray); + } else { + if (nAnnotFlag & ANNOTFLAG_PRINT) + ParserStream(pPageDic, pAnnotDic, pRectArray, pObjectArray); + } + } + return FLATTEN_SUCCESS; +} + +FX_FLOAT GetMinMaxValue(CPDF_RectArray& array, + FPDF_TYPE type, + FPDF_VALUE value) { + int nRects = array.GetSize(); + FX_FLOAT fRet = 0.0f; + + if (nRects <= 0) + return 0.0f; + + FX_FLOAT* pArray = new FX_FLOAT[nRects]; + switch (value) { + case LEFT: { + for (int i = 0; i < nRects; i++) + pArray[i] = CFX_FloatRect(array.GetAt(i)).left; + + break; + } + case TOP: { + for (int i = 0; i < nRects; i++) + pArray[i] = CFX_FloatRect(array.GetAt(i)).top; + + break; + } + case RIGHT: { + for (int i = 0; i < nRects; i++) + pArray[i] = CFX_FloatRect(array.GetAt(i)).right; + + break; + } + case BOTTOM: { + for (int i = 0; i < nRects; i++) + pArray[i] = CFX_FloatRect(array.GetAt(i)).bottom; + + break; + } + default: + break; + } + fRet = pArray[0]; + if (type == MAX) { + for (int i = 1; i < nRects; i++) + if (fRet <= pArray[i]) + fRet = pArray[i]; + } else { + for (int i = 1; i < nRects; i++) + if (fRet >= pArray[i]) + fRet = pArray[i]; + } + delete[] pArray; + return fRet; +} + +CFX_FloatRect CalculateRect(CPDF_RectArray* pRectArray) { + CFX_FloatRect rcRet; + + rcRet.left = GetMinMaxValue(*pRectArray, MIN, LEFT); + rcRet.top = GetMinMaxValue(*pRectArray, MAX, TOP); + rcRet.right = GetMinMaxValue(*pRectArray, MAX, RIGHT); + rcRet.bottom = GetMinMaxValue(*pRectArray, MIN, BOTTOM); + + return rcRet; +} + +void SetPageContents(CFX_ByteString key, + CPDF_Dictionary* pPage, + CPDF_Document* pDocument) { + CPDF_Object* pContentsObj = pPage->GetStreamBy("Contents"); + if (!pContentsObj) { + pContentsObj = pPage->GetArrayBy("Contents"); + } + + if (!pContentsObj) { + // Create a new contents dictionary + if (!key.IsEmpty()) { + CPDF_Stream* pNewContents = new CPDF_Stream(NULL, 0, new CPDF_Dictionary); + pPage->SetAtReference("Contents", pDocument, + pDocument->AddIndirectObject(pNewContents)); + + CFX_ByteString sStream; + sStream.Format("q 1 0 0 1 0 0 cm /%s Do Q", key.c_str()); + pNewContents->SetData((const uint8_t*)sStream, sStream.GetLength(), FALSE, + FALSE); + } + return; + } + + CPDF_Array* pContentsArray = NULL; + + switch (pContentsObj->GetType()) { + case CPDF_Object::STREAM: { + pContentsArray = new CPDF_Array; + CPDF_Stream* pContents = pContentsObj->AsStream(); + FX_DWORD dwObjNum = pDocument->AddIndirectObject(pContents); + CPDF_StreamAcc acc; + acc.LoadAllData(pContents); + CFX_ByteString sStream = "q\n"; + CFX_ByteString sBody = + CFX_ByteString((const FX_CHAR*)acc.GetData(), acc.GetSize()); + sStream = sStream + sBody + "\nQ"; + pContents->SetData((const uint8_t*)sStream, sStream.GetLength(), FALSE, + FALSE); + pContentsArray->AddReference(pDocument, dwObjNum); + break; + } + + case CPDF_Object::ARRAY: { + pContentsArray = pContentsObj->AsArray(); + break; + } + default: + break; + } + + if (!pContentsArray) + return; + + FX_DWORD dwObjNum = pDocument->AddIndirectObject(pContentsArray); + pPage->SetAtReference("Contents", pDocument, dwObjNum); + + if (!key.IsEmpty()) { + CPDF_Stream* pNewContents = new CPDF_Stream(NULL, 0, new CPDF_Dictionary); + dwObjNum = pDocument->AddIndirectObject(pNewContents); + pContentsArray->AddReference(pDocument, dwObjNum); + + CFX_ByteString sStream; + sStream.Format("q 1 0 0 1 0 0 cm /%s Do Q", key.c_str()); + pNewContents->SetData((const uint8_t*)sStream, sStream.GetLength(), FALSE, + FALSE); + } +} + +CFX_Matrix GetMatrix(CFX_FloatRect rcAnnot, + CFX_FloatRect rcStream, + const CFX_Matrix& matrix) { + if (rcStream.IsEmpty()) + return CFX_Matrix(); + + matrix.TransformRect(rcStream); + rcStream.Normalize(); + + FX_FLOAT a = rcAnnot.Width() / rcStream.Width(); + FX_FLOAT d = rcAnnot.Height() / rcStream.Height(); + + FX_FLOAT e = rcAnnot.left - rcStream.left * a; + FX_FLOAT f = rcAnnot.bottom - rcStream.bottom * d; + return CFX_Matrix(a, 0, 0, d, e, f); +} + +void GetOffset(FX_FLOAT& fa, + FX_FLOAT& fd, + FX_FLOAT& fe, + FX_FLOAT& ff, + CFX_FloatRect rcAnnot, + CFX_FloatRect rcStream, + const CFX_Matrix& matrix) { + FX_FLOAT fStreamWidth = 0.0f; + FX_FLOAT fStreamHeight = 0.0f; + + if (matrix.a != 0 && matrix.d != 0) { + fStreamWidth = rcStream.right - rcStream.left; + fStreamHeight = rcStream.top - rcStream.bottom; + } else { + fStreamWidth = rcStream.top - rcStream.bottom; + fStreamHeight = rcStream.right - rcStream.left; + } + + FX_FLOAT x1 = + matrix.a * rcStream.left + matrix.c * rcStream.bottom + matrix.e; + FX_FLOAT y1 = + matrix.b * rcStream.left + matrix.d * rcStream.bottom + matrix.f; + FX_FLOAT x2 = matrix.a * rcStream.left + matrix.c * rcStream.top + matrix.e; + FX_FLOAT y2 = matrix.b * rcStream.left + matrix.d * rcStream.top + matrix.f; + FX_FLOAT x3 = + matrix.a * rcStream.right + matrix.c * rcStream.bottom + matrix.e; + FX_FLOAT y3 = + matrix.b * rcStream.right + matrix.d * rcStream.bottom + matrix.f; + FX_FLOAT x4 = matrix.a * rcStream.right + matrix.c * rcStream.top + matrix.e; + FX_FLOAT y4 = matrix.b * rcStream.right + matrix.d * rcStream.top + matrix.f; + + FX_FLOAT left = std::min(std::min(x1, x2), std::min(x3, x4)); + FX_FLOAT bottom = std::min(std::min(y1, y2), std::min(y3, y4)); + + fa = (rcAnnot.right - rcAnnot.left) / fStreamWidth; + fd = (rcAnnot.top - rcAnnot.bottom) / fStreamHeight; + fe = rcAnnot.left - left * fa; + ff = rcAnnot.bottom - bottom * fd; +} + +DLLEXPORT int STDCALL FPDFPage_Flatten(FPDF_PAGE page, int nFlag) { + CPDF_Page* pPage = CPDFPageFromFPDFPage(page); + if (!page) { + return FLATTEN_FAIL; + } + + CPDF_Document* pDocument = pPage->m_pDocument; + CPDF_Dictionary* pPageDict = pPage->m_pFormDict; + + if (!pDocument || !pPageDict) { + return FLATTEN_FAIL; + } + + CPDF_ObjectArray ObjectArray; + CPDF_RectArray RectArray; + + int iRet = FLATTEN_FAIL; + iRet = ParserAnnots(pDocument, pPageDict, &RectArray, &ObjectArray, nFlag); + if (iRet == FLATTEN_NOTHINGTODO || iRet == FLATTEN_FAIL) + return iRet; + + CFX_FloatRect rcOriginalCB; + CFX_FloatRect rcMerger = CalculateRect(&RectArray); + CFX_FloatRect rcOriginalMB = pPageDict->GetRectBy("MediaBox"); + + if (pPageDict->KeyExist("CropBox")) + rcOriginalMB = pPageDict->GetRectBy("CropBox"); + + if (rcOriginalMB.IsEmpty()) { + rcOriginalMB = CFX_FloatRect(0.0f, 0.0f, 612.0f, 792.0f); + } + + rcMerger.left = + rcMerger.left < rcOriginalMB.left ? rcOriginalMB.left : rcMerger.left; + rcMerger.right = + rcMerger.right > rcOriginalMB.right ? rcOriginalMB.right : rcMerger.right; + rcMerger.top = + rcMerger.top > rcOriginalMB.top ? rcOriginalMB.top : rcMerger.top; + rcMerger.bottom = rcMerger.bottom < rcOriginalMB.bottom ? rcOriginalMB.bottom + : rcMerger.bottom; + + if (pPageDict->KeyExist("ArtBox")) + rcOriginalCB = pPageDict->GetRectBy("ArtBox"); + else + rcOriginalCB = rcOriginalMB; + + if (!rcOriginalMB.IsEmpty()) { + CPDF_Array* pMediaBox = new CPDF_Array(); + pMediaBox->Add(new CPDF_Number(rcOriginalMB.left)); + pMediaBox->Add(new CPDF_Number(rcOriginalMB.bottom)); + pMediaBox->Add(new CPDF_Number(rcOriginalMB.right)); + pMediaBox->Add(new CPDF_Number(rcOriginalMB.top)); + pPageDict->SetAt("MediaBox", pMediaBox); + } + + if (!rcOriginalCB.IsEmpty()) { + CPDF_Array* pCropBox = new CPDF_Array(); + pCropBox->Add(new CPDF_Number(rcOriginalCB.left)); + pCropBox->Add(new CPDF_Number(rcOriginalCB.bottom)); + pCropBox->Add(new CPDF_Number(rcOriginalCB.right)); + pCropBox->Add(new CPDF_Number(rcOriginalCB.top)); + pPageDict->SetAt("ArtBox", pCropBox); + } + + CPDF_Dictionary* pRes = pPageDict->GetDictBy("Resources"); + if (!pRes) { + pRes = new CPDF_Dictionary; + pPageDict->SetAt("Resources", pRes); + } + + CPDF_Stream* pNewXObject = new CPDF_Stream(NULL, 0, new CPDF_Dictionary); + FX_DWORD dwObjNum = pDocument->AddIndirectObject(pNewXObject); + CPDF_Dictionary* pPageXObject = pRes->GetDictBy("XObject"); + if (!pPageXObject) { + pPageXObject = new CPDF_Dictionary; + pRes->SetAt("XObject", pPageXObject); + } + + CFX_ByteString key = ""; + int nStreams = ObjectArray.GetSize(); + + if (nStreams > 0) { + for (int iKey = 0; /*iKey < 100*/; iKey++) { + char sExtend[5] = {}; + FXSYS_itoa(iKey, sExtend, 10); + key = CFX_ByteString("FFT") + CFX_ByteString(sExtend); + + if (!pPageXObject->KeyExist(key)) + break; + } + } + + SetPageContents(key, pPageDict, pDocument); + + CPDF_Dictionary* pNewXORes = NULL; + + if (!key.IsEmpty()) { + pPageXObject->SetAtReference(key, pDocument, dwObjNum); + CPDF_Dictionary* pNewOXbjectDic = pNewXObject->GetDict(); + pNewXORes = new CPDF_Dictionary; + pNewOXbjectDic->SetAt("Resources", pNewXORes); + pNewOXbjectDic->SetAtName("Type", "XObject"); + pNewOXbjectDic->SetAtName("Subtype", "Form"); + pNewOXbjectDic->SetAtInteger("FormType", 1); + pNewOXbjectDic->SetAtName("Name", "FRM"); + CFX_FloatRect rcBBox = pPageDict->GetRectBy("ArtBox"); + pNewOXbjectDic->SetAtRect("BBox", rcBBox); + } + + for (int i = 0; i < nStreams; i++) { + CPDF_Dictionary* pAnnotDic = ObjectArray.GetAt(i); + if (!pAnnotDic) + continue; + + CFX_FloatRect rcAnnot = pAnnotDic->GetRectBy("Rect"); + rcAnnot.Normalize(); + + CFX_ByteString sAnnotState = pAnnotDic->GetStringBy("AS"); + CPDF_Dictionary* pAnnotAP = pAnnotDic->GetDictBy("AP"); + if (!pAnnotAP) + continue; + + CPDF_Stream* pAPStream = pAnnotAP->GetStreamBy("N"); + if (!pAPStream) { + CPDF_Dictionary* pAPDic = pAnnotAP->GetDictBy("N"); + if (!pAPDic) + continue; + + if (!sAnnotState.IsEmpty()) { + pAPStream = pAPDic->GetStreamBy(sAnnotState); + } else { + auto it = pAPDic->begin(); + if (it != pAPDic->end()) { + CPDF_Object* pFirstObj = it->second; + if (pFirstObj) { + if (pFirstObj->IsReference()) + pFirstObj = pFirstObj->GetDirect(); + if (!pFirstObj->IsStream()) + continue; + pAPStream = pFirstObj->AsStream(); + } + } + } + } + if (!pAPStream) + continue; + + CPDF_Dictionary* pAPDic = pAPStream->GetDict(); + CFX_Matrix matrix = pAPDic->GetMatrixBy("Matrix"); + + CFX_FloatRect rcStream; + if (pAPDic->KeyExist("Rect")) + rcStream = pAPDic->GetRectBy("Rect"); + else if (pAPDic->KeyExist("BBox")) + rcStream = pAPDic->GetRectBy("BBox"); + + if (rcStream.IsEmpty()) + continue; + + CPDF_Object* pObj = pAPStream; + + if (pObj) { + CPDF_Dictionary* pObjDic = pObj->GetDict(); + if (pObjDic) { + pObjDic->SetAtName("Type", "XObject"); + pObjDic->SetAtName("Subtype", "Form"); + } + } + + CPDF_Dictionary* pXObject = pNewXORes->GetDictBy("XObject"); + if (!pXObject) { + pXObject = new CPDF_Dictionary; + pNewXORes->SetAt("XObject", pXObject); + } + + CFX_ByteString sFormName; + sFormName.Format("F%d", i); + FX_DWORD dwObjNum = pDocument->AddIndirectObject(pObj); + pXObject->SetAtReference(sFormName, pDocument, dwObjNum); + + CPDF_StreamAcc acc; + acc.LoadAllData(pNewXObject); + + const uint8_t* pData = acc.GetData(); + CFX_ByteString sStream(pData, acc.GetSize()); + CFX_ByteString sTemp; + + if (matrix.IsIdentity()) { + matrix.a = 1.0f; + matrix.b = 0.0f; + matrix.c = 0.0f; + matrix.d = 1.0f; + matrix.e = 0.0f; + matrix.f = 0.0f; + } + + CFX_Matrix m = GetMatrix(rcAnnot, rcStream, matrix); + sTemp.Format("q %f 0 0 %f %f %f cm /%s Do Q\n", m.a, m.d, m.e, m.f, + sFormName.c_str()); + sStream += sTemp; + + pNewXObject->SetData((const uint8_t*)sStream, sStream.GetLength(), FALSE, + FALSE); + } + pPageDict->RemoveAt("Annots"); + + ObjectArray.RemoveAll(); + RectArray.RemoveAll(); + + return FLATTEN_SUCCESS; +} |