// Copyright 2016 PDFium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com #include "core/fpdfapi/edit/cpdf_pagecontentgenerator.h" #include #include #include "core/fpdfapi/font/cpdf_font.h" #include "core/fpdfapi/page/cpdf_docpagedata.h" #include "core/fpdfapi/page/cpdf_image.h" #include "core/fpdfapi/page/cpdf_imageobject.h" #include "core/fpdfapi/page/cpdf_page.h" #include "core/fpdfapi/page/cpdf_path.h" #include "core/fpdfapi/page/cpdf_pathobject.h" #include "core/fpdfapi/page/cpdf_textobject.h" #include "core/fpdfapi/parser/cpdf_array.h" #include "core/fpdfapi/parser/cpdf_dictionary.h" #include "core/fpdfapi/parser/cpdf_document.h" #include "core/fpdfapi/parser/cpdf_name.h" #include "core/fpdfapi/parser/cpdf_number.h" #include "core/fpdfapi/parser/cpdf_reference.h" #include "core/fpdfapi/parser/cpdf_stream.h" #include "core/fpdfapi/parser/fpdf_parser_decode.h" #include "core/fpdfapi/parser/fpdf_parser_utility.h" #include "third_party/skia_shared/SkFloatToDecimal.h" namespace { std::ostream& operator<<(std::ostream& ar, const CFX_Matrix& matrix) { ar << matrix.a << " " << matrix.b << " " << matrix.c << " " << matrix.d << " " << matrix.e << " " << matrix.f; return ar; } bool GetColor(const CPDF_Color* pColor, float* rgb) { int intRGB[3]; if (!pColor || !pColor->IsColorSpaceRGB() || !pColor->GetRGB(&intRGB[0], &intRGB[1], &intRGB[2])) { return false; } rgb[0] = intRGB[0] / 255.0f; rgb[1] = intRGB[1] / 255.0f; rgb[2] = intRGB[2] / 255.0f; return true; } } // namespace CPDF_PageContentGenerator::CPDF_PageContentGenerator( CPDF_PageObjectHolder* pObjHolder) : m_pObjHolder(pObjHolder), m_pDocument(pObjHolder->GetDocument()) { for (const auto& pObj : *pObjHolder->GetPageObjectList()) { if (pObj) m_pageObjects.emplace_back(pObj.get()); } } CPDF_PageContentGenerator::~CPDF_PageContentGenerator() {} void CPDF_PageContentGenerator::GenerateContent() { ASSERT(m_pObjHolder->IsPage()); CPDF_Document* pDoc = m_pDocument.Get(); std::ostringstream buf; // Set the default graphic state values buf << "q\n"; if (!m_pObjHolder->GetLastCTM().IsIdentity()) buf << m_pObjHolder->GetLastCTM().GetInverse() << " cm\n"; ProcessDefaultGraphics(&buf); // Process the page objects if (!ProcessPageObjects(&buf)) return; // Return graphics to original state buf << "Q\n"; // Add buffer to a stream in page's 'Contents' CPDF_Dictionary* pPageDict = m_pObjHolder->GetDict(); if (!pPageDict) return; CPDF_Object* pContent = pPageDict->GetObjectFor("Contents"); CPDF_Stream* pStream = pDoc->NewIndirect(); pStream->SetData(&buf); if (pContent) { CPDF_Array* pArray = ToArray(pContent); if (pArray) { pArray->Add(pStream->MakeReference(pDoc)); return; } CPDF_Reference* pReference = ToReference(pContent); if (!pReference) { pPageDict->SetFor("Contents", pStream->MakeReference(pDoc)); return; } CPDF_Object* pDirectObj = pReference->GetDirect(); if (!pDirectObj) { pPageDict->SetFor("Contents", pStream->MakeReference(pDoc)); return; } CPDF_Array* pObjArray = pDirectObj->AsArray(); if (pObjArray) { pObjArray->Add(pStream->MakeReference(pDoc)); return; } if (pDirectObj->IsStream()) { CPDF_Array* pContentArray = pDoc->NewIndirect(); pContentArray->Add(pDirectObj->MakeReference(pDoc)); pContentArray->Add(pStream->MakeReference(pDoc)); pPageDict->SetFor("Contents", pContentArray->MakeReference(pDoc)); return; } } pPageDict->SetFor("Contents", pStream->MakeReference(pDoc)); } ByteString CPDF_PageContentGenerator::RealizeResource( const CPDF_Object* pResource, const ByteString& bsType) { ASSERT(pResource); if (!m_pObjHolder->m_pResources) { m_pObjHolder->m_pResources = m_pDocument->NewIndirect(); m_pObjHolder->GetDict()->SetFor( "Resources", m_pObjHolder->m_pResources->MakeReference(m_pDocument.Get())); } CPDF_Dictionary* pResList = m_pObjHolder->m_pResources->GetDictFor(bsType); if (!pResList) pResList = m_pObjHolder->m_pResources->SetNewFor(bsType); ByteString name; int idnum = 1; while (1) { name = ByteString::Format("FX%c%d", bsType[0], idnum); if (!pResList->KeyExist(name)) break; idnum++; } pResList->SetFor(name, pResource->MakeReference(m_pDocument.Get())); return name; } bool CPDF_PageContentGenerator::ProcessPageObjects(std::ostringstream* buf) { bool bDirty = false; for (auto& pPageObj : m_pageObjects) { if (m_pObjHolder->IsPage() && !pPageObj->IsDirty()) continue; bDirty = true; if (CPDF_ImageObject* pImageObject = pPageObj->AsImage()) ProcessImage(buf, pImageObject); else if (CPDF_PathObject* pPathObj = pPageObj->AsPath()) ProcessPath(buf, pPathObj); else if (CPDF_TextObject* pTextObj = pPageObj->AsText()) ProcessText(buf, pTextObj); pPageObj->SetDirty(false); } return bDirty; } void CPDF_PageContentGenerator::ProcessImage(std::ostringstream* buf, CPDF_ImageObject* pImageObj) { if ((pImageObj->matrix().a == 0 && pImageObj->matrix().b == 0) || (pImageObj->matrix().c == 0 && pImageObj->matrix().d == 0)) { return; } *buf << "q " << pImageObj->matrix() << " cm "; RetainPtr pImage = pImageObj->GetImage(); if (pImage->IsInline()) return; CPDF_Stream* pStream = pImage->GetStream(); if (!pStream) return; bool bWasInline = pStream->IsInline(); if (bWasInline) pImage->ConvertStreamToIndirectObject(); ByteString name = RealizeResource(pStream, "XObject"); if (bWasInline) pImageObj->SetImage( m_pDocument->GetPageData()->GetImage(pStream->GetObjNum())); *buf << "/" << PDF_NameEncode(name) << " Do Q\n"; } // Processing path with operators from Tables 4.9 and 4.10 of PDF spec 1.7: // "re" appends a rectangle (here, used only if the whole path is a rectangle) // "m" moves current point to the given coordinates // "l" creates a line from current point to the new point // "c" adds a Bezier curve from current to last point, using the two other // points as the Bezier control points // Note: "l", "c" change the current point // "h" closes the subpath (appends a line from current to starting point) // Path painting operators: "S", "n", "B", "f", "B*", "f*", depending on // the filling mode and whether we want stroking the path or not. // "Q" restores the graphics state imposed by the ProcessGraphics method. void CPDF_PageContentGenerator::ProcessPath(std::ostringstream* buf, CPDF_PathObject* pPathObj) { ProcessGraphics(buf, pPathObj); *buf << pPathObj->m_Matrix << " cm "; auto& pPoints = pPathObj->m_Path.GetPoints(); if (pPathObj->m_Path.IsRect()) { CFX_PointF diff = pPoints[2].m_Point - pPoints[0].m_Point; *buf << pPoints[0].m_Point.x << " " << pPoints[0].m_Point.y << " " << diff.x << " " << diff.y << " re"; } else { for (size_t i = 0; i < pPoints.size(); i++) { if (i > 0) *buf << " "; char buffer[pdfium::skia::kMaximumSkFloatToDecimalLength]; unsigned size = pdfium::skia::SkFloatToDecimal(pPoints[i].m_Point.x, buffer); buf->write(buffer, size) << " "; size = pdfium::skia::SkFloatToDecimal(pPoints[i].m_Point.y, buffer); buf->write(buffer, size); FXPT_TYPE pointType = pPoints[i].m_Type; if (pointType == FXPT_TYPE::MoveTo) { *buf << " m"; } else if (pointType == FXPT_TYPE::LineTo) { *buf << " l"; } else if (pointType == FXPT_TYPE::BezierTo) { if (i + 2 >= pPoints.size() || !pPoints[i].IsTypeAndOpen(FXPT_TYPE::BezierTo) || !pPoints[i + 1].IsTypeAndOpen(FXPT_TYPE::BezierTo) || pPoints[i + 2].m_Type != FXPT_TYPE::BezierTo) { // If format is not supported, close the path and paint *buf << " h"; break; } *buf << " " << pPoints[i + 1].m_Point.x << " " << pPoints[i + 1].m_Point.y << " " << pPoints[i + 2].m_Point.x << " " << pPoints[i + 2].m_Point.y << " c"; i += 2; } if (pPoints[i].m_CloseFigure) *buf << " h"; } } if (pPathObj->m_FillType == 0) *buf << (pPathObj->m_bStroke ? " S" : " n"); else if (pPathObj->m_FillType == FXFILL_WINDING) *buf << (pPathObj->m_bStroke ? " B" : " f"); else if (pPathObj->m_FillType == FXFILL_ALTERNATE) *buf << (pPathObj->m_bStroke ? " B*" : " f*"); *buf << " Q\n"; } // This method supports color operators rg and RGB from Table 4.24 of PDF spec // 1.7. A color will not be set if the colorspace is not DefaultRGB or the RGB // values cannot be obtained. The method also adds an external graphics // dictionary, as described in Section 4.3.4. // "rg" sets the fill color, "RG" sets the stroke color (using DefaultRGB) // "w" sets the stroke line width. // "ca" sets the fill alpha, "CA" sets the stroke alpha. // "q" saves the graphics state, so that the settings can later be reversed void CPDF_PageContentGenerator::ProcessGraphics(std::ostringstream* buf, CPDF_PageObject* pPageObj) { *buf << "q "; float fillColor[3]; if (GetColor(pPageObj->m_ColorState.GetFillColor(), fillColor)) { *buf << fillColor[0] << " " << fillColor[1] << " " << fillColor[2] << " rg "; } float strokeColor[3]; if (GetColor(pPageObj->m_ColorState.GetStrokeColor(), strokeColor)) { *buf << strokeColor[0] << " " << strokeColor[1] << " " << strokeColor[2] << " RG "; } float lineWidth = pPageObj->m_GraphState.GetLineWidth(); if (lineWidth != 1.0f) *buf << lineWidth << " w "; CFX_GraphStateData::LineCap lineCap = pPageObj->m_GraphState.GetLineCap(); if (lineCap != CFX_GraphStateData::LineCapButt) *buf << static_cast(lineCap) << " J "; CFX_GraphStateData::LineJoin lineJoin = pPageObj->m_GraphState.GetLineJoin(); if (lineJoin != CFX_GraphStateData::LineJoinMiter) *buf << static_cast(lineJoin) << " j "; GraphicsData graphD; graphD.fillAlpha = pPageObj->m_GeneralState.GetFillAlpha(); graphD.strokeAlpha = pPageObj->m_GeneralState.GetStrokeAlpha(); graphD.blendType = pPageObj->m_GeneralState.GetBlendType(); if (graphD.fillAlpha == 1.0f && graphD.strokeAlpha == 1.0f && (graphD.blendType == FXDIB_BLEND_UNSUPPORTED || graphD.blendType == FXDIB_BLEND_NORMAL)) { return; } ByteString name; auto it = m_pObjHolder->m_GraphicsMap.find(graphD); if (it != m_pObjHolder->m_GraphicsMap.end()) { name = it->second; } else { auto gsDict = pdfium::MakeUnique(); if (graphD.fillAlpha != 1.0f) gsDict->SetNewFor("ca", graphD.fillAlpha); if (graphD.strokeAlpha != 1.0f) gsDict->SetNewFor("CA", graphD.strokeAlpha); if (graphD.blendType != FXDIB_BLEND_UNSUPPORTED && graphD.blendType != FXDIB_BLEND_NORMAL) { gsDict->SetNewFor("BM", pPageObj->m_GeneralState.GetBlendMode()); } CPDF_Object* pDict = m_pDocument->AddIndirectObject(std::move(gsDict)); name = RealizeResource(pDict, "ExtGState"); m_pObjHolder->m_GraphicsMap[graphD] = name; } *buf << "/" << PDF_NameEncode(name) << " gs "; } void CPDF_PageContentGenerator::ProcessDefaultGraphics( std::ostringstream* buf) { *buf << "0 0 0 RG 0 0 0 rg 1 w " << static_cast(CFX_GraphStateData::LineCapButt) << " J " << static_cast(CFX_GraphStateData::LineJoinMiter) << " j\n"; GraphicsData defaultGraphics; defaultGraphics.fillAlpha = 1.0f; defaultGraphics.strokeAlpha = 1.0f; defaultGraphics.blendType = FXDIB_BLEND_NORMAL; auto it = m_pObjHolder->m_GraphicsMap.find(defaultGraphics); ByteString name; if (it != m_pObjHolder->m_GraphicsMap.end()) { name = it->second; } else { auto gsDict = pdfium::MakeUnique(); gsDict->SetNewFor("ca", defaultGraphics.fillAlpha); gsDict->SetNewFor("CA", defaultGraphics.strokeAlpha); gsDict->SetNewFor("BM", "Normal"); CPDF_Object* pDict = m_pDocument->AddIndirectObject(std::move(gsDict)); name = RealizeResource(pDict, "ExtGState"); m_pObjHolder->m_GraphicsMap[defaultGraphics] = name; } *buf << "/" << PDF_NameEncode(name).c_str() << " gs "; } // This method adds text to the buffer, BT begins the text object, ET ends it. // Tm sets the text matrix (allows positioning and transforming text). // Tf sets the font name (from Font in Resources) and font size. // Tj sets the actual text, <####...> is used when specifying charcodes. void CPDF_PageContentGenerator::ProcessText(std::ostringstream* buf, CPDF_TextObject* pTextObj) { ProcessGraphics(buf, pTextObj); *buf << "BT " << pTextObj->GetTextMatrix() << " Tm "; CPDF_Font* pFont = pTextObj->GetFont(); if (!pFont) pFont = CPDF_Font::GetStockFont(m_pDocument.Get(), "Helvetica"); FontData fontD; if (pFont->IsType1Font()) fontD.type = "Type1"; else if (pFont->IsTrueTypeFont()) fontD.type = "TrueType"; else if (pFont->IsCIDFont()) fontD.type = "Type0"; else return; fontD.baseFont = pFont->GetBaseFont(); auto it = m_pObjHolder->m_FontsMap.find(fontD); ByteString dictName; if (it != m_pObjHolder->m_FontsMap.end()) { dictName = it->second; } else { CPDF_Object* pIndirectFont = pFont->GetFontDict(); if (pIndirectFont->IsInline()) { // In this case we assume it must be a standard font auto fontDict = pdfium::MakeUnique(); fontDict->SetNewFor("Type", "Font"); fontDict->SetNewFor("Subtype", fontD.type); fontDict->SetNewFor("BaseFont", fontD.baseFont); pIndirectFont = m_pDocument->AddIndirectObject(std::move(fontDict)); } dictName = RealizeResource(pIndirectFont, "Font"); m_pObjHolder->m_FontsMap[fontD] = dictName; } *buf << "/" << PDF_NameEncode(dictName) << " " << pTextObj->GetFontSize() << " Tf "; ByteString text; for (uint32_t charcode : pTextObj->GetCharCodes()) { if (charcode != CPDF_Font::kInvalidCharCode) pFont->AppendChar(&text, charcode); } *buf << PDF_EncodeString(text, true) << " Tj ET"; *buf << " Q\n"; }