// Copyright 2016 PDFium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com #include "core/fpdfapi/parser/cpdf_stream.h" #include #include #include "constants/stream_dict_common.h" #include "core/fpdfapi/edit/cpdf_encryptor.h" #include "core/fpdfapi/edit/cpdf_flateencoder.h" #include "core/fpdfapi/parser/cpdf_dictionary.h" #include "core/fpdfapi/parser/cpdf_number.h" #include "core/fpdfapi/parser/cpdf_stream_acc.h" #include "core/fpdfapi/parser/fpdf_parser_decode.h" #include "core/fxcrt/fx_stream.h" #include "third_party/base/numerics/safe_conversions.h" #include "third_party/base/ptr_util.h" #include "third_party/base/stl_util.h" namespace { bool IsMetaDataStreamDictionary(const CPDF_Dictionary* dict) { return dict && dict->GetStringFor("Type") == "Metadata" && dict->GetStringFor("Subtype") == "XML"; } } // namespace CPDF_Stream::CPDF_Stream() {} CPDF_Stream::CPDF_Stream(std::unique_ptr pData, uint32_t size, std::unique_ptr pDict) : m_pDict(std::move(pDict)) { SetData(std::move(pData), size); } CPDF_Stream::~CPDF_Stream() { m_ObjNum = kInvalidObjNum; if (m_pDict && m_pDict->GetObjNum() == kInvalidObjNum) m_pDict.release(); // lowercase release, release ownership. } CPDF_Object::Type CPDF_Stream::GetType() const { return kStream; } CPDF_Dictionary* CPDF_Stream::GetDict() { return m_pDict.get(); } const CPDF_Dictionary* CPDF_Stream::GetDict() const { return m_pDict.get(); } bool CPDF_Stream::IsStream() const { return true; } CPDF_Stream* CPDF_Stream::AsStream() { return this; } const CPDF_Stream* CPDF_Stream::AsStream() const { return this; } void CPDF_Stream::InitStream(pdfium::span pData, std::unique_ptr pDict) { m_pDict = std::move(pDict); SetData(pData); } void CPDF_Stream::InitStreamFromFile( const RetainPtr& pFile, std::unique_ptr pDict) { m_pDict = std::move(pDict); m_bMemoryBased = false; m_pDataBuf.reset(); m_pFile = pFile; m_dwSize = pdfium::base::checked_cast(pFile->GetSize()); if (m_pDict) m_pDict->SetNewFor("Length", static_cast(m_dwSize)); } std::unique_ptr CPDF_Stream::Clone() const { return CloneObjectNonCyclic(false); } std::unique_ptr CPDF_Stream::CloneNonCyclic( bool bDirect, std::set* pVisited) const { pVisited->insert(this); auto pAcc = pdfium::MakeRetain(this); pAcc->LoadAllDataRaw(); uint32_t streamSize = pAcc->GetSize(); const CPDF_Dictionary* pDict = GetDict(); std::unique_ptr pNewDict; if (pDict && !pdfium::ContainsKey(*pVisited, pDict)) { pNewDict = ToDictionary(static_cast(pDict)->CloneNonCyclic( bDirect, pVisited)); } return pdfium::MakeUnique(pAcc->DetachData(), streamSize, std::move(pNewDict)); } void CPDF_Stream::SetDataAndRemoveFilter(pdfium::span pData) { SetData(pData); m_pDict->RemoveFor("Filter"); m_pDict->RemoveFor(pdfium::stream::kDecodeParms); } void CPDF_Stream::SetDataFromStringstreamAndRemoveFilter( std::ostringstream* stream) { if (stream->tellp() <= 0) { SetDataAndRemoveFilter({}); return; } SetDataAndRemoveFilter( {reinterpret_cast(stream->str().c_str()), static_cast(stream->tellp())}); } void CPDF_Stream::SetData(pdfium::span pData) { std::unique_ptr data_copy; if (!pData.empty()) { data_copy.reset(FX_Alloc(uint8_t, pData.size())); memcpy(data_copy.get(), pData.data(), pData.size()); } SetData(std::move(data_copy), pData.size()); } void CPDF_Stream::SetData(std::unique_ptr pData, uint32_t size) { m_bMemoryBased = true; m_pFile = nullptr; m_pDataBuf = std::move(pData); m_dwSize = size; if (!m_pDict) m_pDict = pdfium::MakeUnique(); m_pDict->SetNewFor("Length", static_cast(size)); } void CPDF_Stream::SetDataFromStringstream(std::ostringstream* stream) { if (stream->tellp() <= 0) { SetData({}); return; } SetData({reinterpret_cast(stream->str().c_str()), static_cast(stream->tellp())}); } bool CPDF_Stream::ReadRawData(FX_FILESIZE offset, uint8_t* buf, uint32_t size) const { if (!m_bMemoryBased && m_pFile) return m_pFile->ReadBlock(buf, offset, size); if (m_pDataBuf) memcpy(buf, m_pDataBuf.get() + offset, size); return true; } bool CPDF_Stream::HasFilter() const { return m_pDict && m_pDict->KeyExist("Filter"); } WideString CPDF_Stream::GetUnicodeText() const { auto pAcc = pdfium::MakeRetain(this); pAcc->LoadAllDataFiltered(); return PDF_DecodeText(pAcc->GetData(), pAcc->GetSize()); } bool CPDF_Stream::WriteTo(IFX_ArchiveStream* archive, const CPDF_Encryptor* encryptor) const { const bool is_metadata = IsMetaDataStreamDictionary(GetDict()); CPDF_FlateEncoder encoder(this, !is_metadata); std::vector encrypted_data; pdfium::span data = encoder.GetSpan(); if (encryptor && !is_metadata) { encrypted_data = encryptor->Encrypt(data); data = encrypted_data; } if (static_cast(encoder.GetDict()->GetIntegerFor("Length")) != data.size()) { encoder.CloneDict(); encoder.GetClonedDict()->SetNewFor( "Length", static_cast(data.size())); } if (!encoder.GetDict()->WriteTo(archive, encryptor)) return false; if (!archive->WriteString("stream\r\n") || !archive->WriteBlock(data.data(), data.size()) || !archive->WriteString("\r\nendstream")) { return false; } return true; }