// Copyright 2014 PDFium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com #include "public/fpdf_text.h" #include "core/fpdfapi/fpdf_page/include/cpdf_page.h" #include "core/fpdftext/include/ipdf_linkextract.h" #include "core/fpdftext/include/ipdf_textpage.h" #include "core/fpdftext/include/ipdf_textpagefind.h" #include "core/include/fpdfdoc/fpdf_doc.h" #include "fpdfsdk/include/fsdk_define.h" #ifdef PDF_ENABLE_XFA #include "fpdfsdk/include/fpdfxfa/fpdfxfa_doc.h" #include "fpdfsdk/include/fpdfxfa/fpdfxfa_page.h" #endif // PDF_ENABLE_XFA #ifdef _WIN32 #include <tchar.h> #endif DLLEXPORT FPDF_TEXTPAGE STDCALL FPDFText_LoadPage(FPDF_PAGE page) { CPDF_Page* pPDFPage = CPDFPageFromFPDFPage(page); if (!pPDFPage) return nullptr; #ifdef PDF_ENABLE_XFA CPDFXFA_Page* pPage = (CPDFXFA_Page*)page; CPDFXFA_Document* pDoc = pPage->GetDocument(); CPDF_ViewerPreferences viewRef(pDoc->GetPDFDoc()); #else // PDF_ENABLE_XFA CPDF_ViewerPreferences viewRef(pPDFPage->m_pDocument); #endif // PDF_ENABLE_XFA IPDF_TextPage* textpage = IPDF_TextPage::CreateTextPage(pPDFPage, viewRef.IsDirectionR2L()); textpage->ParseTextPage(); return textpage; } DLLEXPORT void STDCALL FPDFText_ClosePage(FPDF_TEXTPAGE text_page) { delete (IPDF_TextPage*)text_page; } DLLEXPORT int STDCALL FPDFText_CountChars(FPDF_TEXTPAGE text_page) { if (!text_page) return -1; IPDF_TextPage* textpage = (IPDF_TextPage*)text_page; return textpage->CountChars(); } DLLEXPORT unsigned int STDCALL FPDFText_GetUnicode(FPDF_TEXTPAGE text_page, int index) { if (!text_page) return -1; IPDF_TextPage* textpage = (IPDF_TextPage*)text_page; if (index < 0 || index >= textpage->CountChars()) return 0; FPDF_CHAR_INFO charinfo; textpage->GetCharInfo(index, &charinfo); return charinfo.m_Unicode; } DLLEXPORT double STDCALL FPDFText_GetFontSize(FPDF_TEXTPAGE text_page, int index) { if (!text_page) return 0; IPDF_TextPage* textpage = (IPDF_TextPage*)text_page; if (index < 0 || index >= textpage->CountChars()) return 0; FPDF_CHAR_INFO charinfo; textpage->GetCharInfo(index, &charinfo); return charinfo.m_FontSize; } DLLEXPORT void STDCALL FPDFText_GetCharBox(FPDF_TEXTPAGE text_page, int index, double* left, double* right, double* bottom, double* top) { if (!text_page) return; IPDF_TextPage* textpage = (IPDF_TextPage*)text_page; if (index < 0 || index >= textpage->CountChars()) return; FPDF_CHAR_INFO charinfo; textpage->GetCharInfo(index, &charinfo); *left = charinfo.m_CharBox.left; *right = charinfo.m_CharBox.right; *bottom = charinfo.m_CharBox.bottom; *top = charinfo.m_CharBox.top; } // select DLLEXPORT int STDCALL FPDFText_GetCharIndexAtPos(FPDF_TEXTPAGE text_page, double x, double y, double xTolerance, double yTolerance) { if (!text_page) return -3; IPDF_TextPage* textpage = (IPDF_TextPage*)text_page; return textpage->GetIndexAtPos((FX_FLOAT)x, (FX_FLOAT)y, (FX_FLOAT)xTolerance, (FX_FLOAT)yTolerance); } DLLEXPORT int STDCALL FPDFText_GetText(FPDF_TEXTPAGE text_page, int start, int count, unsigned short* result) { if (!text_page) return 0; IPDF_TextPage* textpage = (IPDF_TextPage*)text_page; if (start >= textpage->CountChars()) return 0; CFX_WideString str = textpage->GetPageText(start, count); if (str.GetLength() > count) str = str.Left(count); CFX_ByteString cbUTF16str = str.UTF16LE_Encode(); FXSYS_memcpy(result, cbUTF16str.GetBuffer(cbUTF16str.GetLength()), cbUTF16str.GetLength()); cbUTF16str.ReleaseBuffer(cbUTF16str.GetLength()); return cbUTF16str.GetLength() / sizeof(unsigned short); } DLLEXPORT int STDCALL FPDFText_CountRects(FPDF_TEXTPAGE text_page, int start, int count) { if (!text_page) return 0; IPDF_TextPage* textpage = (IPDF_TextPage*)text_page; return textpage->CountRects(start, count); } DLLEXPORT void STDCALL FPDFText_GetRect(FPDF_TEXTPAGE text_page, int rect_index, double* left, double* top, double* right, double* bottom) { if (!text_page) return; IPDF_TextPage* textpage = (IPDF_TextPage*)text_page; CFX_FloatRect rect; textpage->GetRect(rect_index, rect.left, rect.top, rect.right, rect.bottom); *left = rect.left; *top = rect.top; *right = rect.right; *bottom = rect.bottom; } DLLEXPORT int STDCALL FPDFText_GetBoundedText(FPDF_TEXTPAGE text_page, double left, double top, double right, double bottom, unsigned short* buffer, int buflen) { if (!text_page) return 0; IPDF_TextPage* textpage = (IPDF_TextPage*)text_page; CFX_FloatRect rect((FX_FLOAT)left, (FX_FLOAT)bottom, (FX_FLOAT)right, (FX_FLOAT)top); CFX_WideString str = textpage->GetTextByRect(rect); if (buflen <= 0 || !buffer) { return str.GetLength(); } CFX_ByteString cbUTF16Str = str.UTF16LE_Encode(); int len = cbUTF16Str.GetLength() / sizeof(unsigned short); int size = buflen > len ? len : buflen; FXSYS_memcpy(buffer, cbUTF16Str.GetBuffer(size * sizeof(unsigned short)), size * sizeof(unsigned short)); cbUTF16Str.ReleaseBuffer(size * sizeof(unsigned short)); return size; } // Search // -1 for end DLLEXPORT FPDF_SCHHANDLE STDCALL FPDFText_FindStart(FPDF_TEXTPAGE text_page, FPDF_WIDESTRING findwhat, unsigned long flags, int start_index) { if (!text_page) return NULL; IPDF_TextPageFind* textpageFind = NULL; textpageFind = IPDF_TextPageFind::CreatePageFind((IPDF_TextPage*)text_page); FX_STRSIZE len = CFX_WideString::WStringLength(findwhat); textpageFind->FindFirst(CFX_WideString::FromUTF16LE(findwhat, len), flags, start_index); return textpageFind; } DLLEXPORT FPDF_BOOL STDCALL FPDFText_FindNext(FPDF_SCHHANDLE handle) { if (!handle) return FALSE; IPDF_TextPageFind* textpageFind = (IPDF_TextPageFind*)handle; return textpageFind->FindNext(); } DLLEXPORT FPDF_BOOL STDCALL FPDFText_FindPrev(FPDF_SCHHANDLE handle) { if (!handle) return FALSE; IPDF_TextPageFind* textpageFind = (IPDF_TextPageFind*)handle; return textpageFind->FindPrev(); } DLLEXPORT int STDCALL FPDFText_GetSchResultIndex(FPDF_SCHHANDLE handle) { if (!handle) return 0; IPDF_TextPageFind* textpageFind = (IPDF_TextPageFind*)handle; return textpageFind->GetCurOrder(); } DLLEXPORT int STDCALL FPDFText_GetSchCount(FPDF_SCHHANDLE handle) { if (!handle) return 0; IPDF_TextPageFind* textpageFind = (IPDF_TextPageFind*)handle; return textpageFind->GetMatchedCount(); } DLLEXPORT void STDCALL FPDFText_FindClose(FPDF_SCHHANDLE handle) { if (!handle) return; IPDF_TextPageFind* textpageFind = (IPDF_TextPageFind*)handle; delete textpageFind; handle = NULL; } // web link DLLEXPORT FPDF_PAGELINK STDCALL FPDFLink_LoadWebLinks(FPDF_TEXTPAGE text_page) { if (!text_page) return NULL; IPDF_LinkExtract* pageLink = NULL; pageLink = IPDF_LinkExtract::CreateLinkExtract(); pageLink->ExtractLinks((IPDF_TextPage*)text_page); return pageLink; } DLLEXPORT int STDCALL FPDFLink_CountWebLinks(FPDF_PAGELINK link_page) { if (!link_page) return 0; IPDF_LinkExtract* pageLink = (IPDF_LinkExtract*)link_page; return pageLink->CountLinks(); } DLLEXPORT int STDCALL FPDFLink_GetURL(FPDF_PAGELINK link_page, int link_index, unsigned short* buffer, int buflen) { if (!link_page) return 0; IPDF_LinkExtract* pageLink = (IPDF_LinkExtract*)link_page; CFX_WideString url = pageLink->GetURL(link_index); CFX_ByteString cbUTF16URL = url.UTF16LE_Encode(); int len = cbUTF16URL.GetLength() / sizeof(unsigned short); if (!buffer || buflen <= 0) return len; int size = len < buflen ? len : buflen; if (size > 0) { FXSYS_memcpy(buffer, cbUTF16URL.GetBuffer(size * sizeof(unsigned short)), size * sizeof(unsigned short)); cbUTF16URL.ReleaseBuffer(size * sizeof(unsigned short)); } return size; } DLLEXPORT int STDCALL FPDFLink_CountRects(FPDF_PAGELINK link_page, int link_index) { if (!link_page) return 0; IPDF_LinkExtract* pageLink = (IPDF_LinkExtract*)link_page; CFX_RectArray rectArray; pageLink->GetRects(link_index, rectArray); return rectArray.GetSize(); } DLLEXPORT void STDCALL FPDFLink_GetRect(FPDF_PAGELINK link_page, int link_index, int rect_index, double* left, double* top, double* right, double* bottom) { if (!link_page) return; IPDF_LinkExtract* pageLink = (IPDF_LinkExtract*)link_page; CFX_RectArray rectArray; pageLink->GetRects(link_index, rectArray); if (rect_index >= 0 && rect_index < rectArray.GetSize()) { CFX_FloatRect rect = rectArray.GetAt(rect_index); *left = rect.left; *right = rect.right; *top = rect.top; *bottom = rect.bottom; } } DLLEXPORT void STDCALL FPDFLink_CloseWebLinks(FPDF_PAGELINK link_page) { delete (IPDF_LinkExtract*)link_page; }