// Copyright 2017 PDFium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #include "core/fpdfapi/parser/cpdf_hint_tables.h" #include #include #include #include "core/fpdfapi/cpdf_modulemgr.h" #include "core/fpdfapi/parser/cpdf_data_avail.h" #include "core/fpdfapi/parser/cpdf_dictionary.h" #include "core/fpdfapi/parser/cpdf_linearized_header.h" #include "core/fpdfapi/parser/cpdf_object.h" #include "core/fpdfapi/parser/cpdf_read_validator.h" #include "core/fpdfapi/parser/cpdf_stream.h" #include "core/fpdfapi/parser/cpdf_syntax_parser.h" #include "core/fxcrt/cfx_readonlymemorystream.h" #include "core/fxcrt/fx_stream.h" #include "testing/gmock/include/gmock/gmock.h" #include "testing/gtest/include/gtest/gtest.h" #include "testing/utils/path_service.h" #include "third_party/base/ptr_util.h" namespace { RetainPtr MakeValidatorFromFile( const std::string& file_name) { std::string file_path; PathService::GetTestFilePath(file_name, &file_path); ASSERT(!file_path.empty()); return pdfium::MakeRetain( IFX_SeekableReadStream::CreateFromFilename(file_path.c_str()), nullptr); } std::unique_ptr MakeDataAvailFromFile( const std::string& file_name) { return pdfium::MakeUnique( nullptr, MakeValidatorFromFile(file_name), true); } class TestLinearizedHeader final : public CPDF_LinearizedHeader { public: TestLinearizedHeader(const CPDF_Dictionary* pDict, FX_FILESIZE szLastXRefOffset) : CPDF_LinearizedHeader(pDict, szLastXRefOffset) {} static std::unique_ptr MakeHeader( const std::string& inline_data) { CPDF_SyntaxParser parser(pdfium::MakeRetain( pdfium::as_bytes(pdfium::make_span(inline_data)))); std::unique_ptr dict = ToDictionary(parser.GetObjectBody(nullptr)); ASSERT(dict); return pdfium::MakeUnique(dict.get(), 0); } }; } // namespace class CPDF_HintTablesTest : public testing::Test { public: CPDF_HintTablesTest() { // Needs for encoding Hint table stream. CPDF_ModuleMgr::Get()->Init(); } ~CPDF_HintTablesTest() override { CPDF_ModuleMgr::Destroy(); } }; TEST_F(CPDF_HintTablesTest, Load) { auto data_avail = MakeDataAvailFromFile("feature_linearized_loading.pdf"); ASSERT_EQ(CPDF_DataAvail::DocAvailStatus::DataAvailable, data_avail->IsDocAvail(nullptr)); ASSERT_TRUE(data_avail->GetHintTables()); const CPDF_HintTables* hint_tables = data_avail->GetHintTables(); FX_FILESIZE page_start = 0; FX_FILESIZE page_length = 0; uint32_t page_obj_num = 0; ASSERT_TRUE( hint_tables->GetPagePos(0, &page_start, &page_length, &page_obj_num)); EXPECT_EQ(777, page_start); EXPECT_EQ(4328, page_length); EXPECT_EQ(39u, page_obj_num); ASSERT_TRUE( hint_tables->GetPagePos(1, &page_start, &page_length, &page_obj_num)); EXPECT_EQ(5105, page_start); EXPECT_EQ(767, page_length); EXPECT_EQ(1u, page_obj_num); ASSERT_FALSE( hint_tables->GetPagePos(2, &page_start, &page_length, &page_obj_num)); } TEST_F(CPDF_HintTablesTest, PageAndGroupInfos) { auto data_avail = MakeDataAvailFromFile("feature_linearized_loading.pdf"); ASSERT_EQ(CPDF_DataAvail::DocAvailStatus::DataAvailable, data_avail->IsDocAvail(nullptr)); const CPDF_HintTables* hint_tables = data_avail->GetHintTables(); ASSERT_TRUE(hint_tables); ASSERT_EQ(2u, hint_tables->PageInfos().size()); EXPECT_EQ(5u, hint_tables->PageInfos()[0].objects_count()); EXPECT_EQ(777, hint_tables->PageInfos()[0].page_offset()); EXPECT_EQ(4328u, hint_tables->PageInfos()[0].page_length()); EXPECT_EQ(39u, hint_tables->PageInfos()[0].start_obj_num()); ASSERT_EQ(2u, hint_tables->PageInfos()[0].Identifiers().size()); EXPECT_EQ(0u, hint_tables->PageInfos()[0].Identifiers()[0]); EXPECT_EQ(0u, hint_tables->PageInfos()[0].Identifiers()[1]); EXPECT_EQ(3u, hint_tables->PageInfos()[1].objects_count()); EXPECT_EQ(5105, hint_tables->PageInfos()[1].page_offset()); EXPECT_EQ(767u, hint_tables->PageInfos()[1].page_length()); EXPECT_EQ(1u, hint_tables->PageInfos()[1].start_obj_num()); ASSERT_EQ(3u, hint_tables->PageInfos()[1].Identifiers().size()); EXPECT_EQ(2u, hint_tables->PageInfos()[1].Identifiers()[0]); EXPECT_EQ(5u, hint_tables->PageInfos()[1].Identifiers()[1]); EXPECT_EQ(3u, hint_tables->PageInfos()[1].Identifiers()[2]); // SharedGroupInfo ASSERT_EQ(6u, hint_tables->SharedGroupInfos().size()); EXPECT_EQ(777, hint_tables->SharedGroupInfos()[0].m_szOffset); EXPECT_EQ(254u, hint_tables->SharedGroupInfos()[0].m_dwLength); EXPECT_EQ(39u, hint_tables->SharedGroupInfos()[0].m_dwStartObjNum); EXPECT_EQ(1u, hint_tables->SharedGroupInfos()[0].m_dwObjectsCount); EXPECT_EQ(1031, hint_tables->SharedGroupInfos()[1].m_szOffset); EXPECT_EQ(389u, hint_tables->SharedGroupInfos()[1].m_dwLength); EXPECT_EQ(40u, hint_tables->SharedGroupInfos()[1].m_dwStartObjNum); EXPECT_EQ(1u, hint_tables->SharedGroupInfos()[1].m_dwObjectsCount); EXPECT_EQ(1420, hint_tables->SharedGroupInfos()[2].m_szOffset); EXPECT_EQ(726u, hint_tables->SharedGroupInfos()[2].m_dwLength); EXPECT_EQ(41u, hint_tables->SharedGroupInfos()[2].m_dwStartObjNum); EXPECT_EQ(1u, hint_tables->SharedGroupInfos()[2].m_dwObjectsCount); EXPECT_EQ(2146, hint_tables->SharedGroupInfos()[3].m_szOffset); EXPECT_EQ(290u, hint_tables->SharedGroupInfos()[3].m_dwLength); EXPECT_EQ(42u, hint_tables->SharedGroupInfos()[3].m_dwStartObjNum); EXPECT_EQ(1u, hint_tables->SharedGroupInfos()[3].m_dwObjectsCount); EXPECT_EQ(2436, hint_tables->SharedGroupInfos()[4].m_szOffset); EXPECT_EQ(2669u, hint_tables->SharedGroupInfos()[4].m_dwLength); EXPECT_EQ(43u, hint_tables->SharedGroupInfos()[4].m_dwStartObjNum); EXPECT_EQ(1u, hint_tables->SharedGroupInfos()[4].m_dwObjectsCount); EXPECT_EQ(10939, hint_tables->SharedGroupInfos()[5].m_szOffset); EXPECT_EQ(544u, hint_tables->SharedGroupInfos()[5].m_dwLength); EXPECT_EQ(4u, hint_tables->SharedGroupInfos()[5].m_dwStartObjNum); EXPECT_EQ(1u, hint_tables->SharedGroupInfos()[5].m_dwObjectsCount); } TEST_F(CPDF_HintTablesTest, FirstPageOffset) { // Test that valid hint table is loaded, and have correct offset of first page // object. const auto linearized_header = TestLinearizedHeader::MakeHeader( "<< /Linearized 1 /L 19326762 /H [ 123730 3816 ] /O 5932 /E 639518 /N " "102 /T 19220281 >>"); ASSERT_TRUE(linearized_header); // This hint table is extracted from linearized file, generated by qpdf tool. RetainPtr validator = MakeValidatorFromFile("hint_table_102p.bin"); CPDF_SyntaxParser parser(validator, 0); std::unique_ptr stream = ToStream(parser.GetObjectBody(nullptr)); ASSERT_TRUE(stream); auto hint_tables = pdfium::MakeUnique( validator.Get(), linearized_header.get()); // Check that hint table will load. ASSERT_TRUE(hint_tables->LoadHintStream(stream.get())); // Check that hint table have correct first page offset. // 127546 is predefined real value from original file. EXPECT_EQ(127546, hint_tables->GetFirstPageObjOffset()); }