diff options
Diffstat (limited to 'core/include/fpdftext')
-rw-r--r-- | core/include/fpdftext/fpdf_text.h | 346 |
1 files changed, 173 insertions, 173 deletions
diff --git a/core/include/fpdftext/fpdf_text.h b/core/include/fpdftext/fpdf_text.h index 8b5edc348f..2a5e4ac4bd 100644 --- a/core/include/fpdftext/fpdf_text.h +++ b/core/include/fpdftext/fpdf_text.h @@ -1,173 +1,173 @@ -// Copyright 2014 PDFium Authors. All rights reserved.
-// Use of this source code is governed by a BSD-style license that can be
-// found in the LICENSE file.
-
-// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
-
-#ifndef _FPDF_TEXT_H_
-#define _FPDF_TEXT_H_
-#ifndef _FPDF_PARSER_
-#include "../fpdfapi/fpdf_parser.h"
-#endif
-#ifndef _FPDF_PAGEOBJ_H_
-#include "../fpdfapi/fpdf_pageobj.h"
-#endif
-#ifndef _FPDF_PAGE_
-#include "../fpdfapi/fpdf_page.h"
-#endif
-class CPDF_PageObjects;
-#define PDF2TXT_AUTO_ROTATE 1
-#define PDF2TXT_AUTO_WIDTH 2
-#define PDF2TXT_KEEP_COLUMN 4
-#define PDF2TXT_USE_OCR 8
-#define PDF2TXT_INCLUDE_INVISIBLE 16
-void PDF_GetPageText(CFX_ByteStringArray& lines, CPDF_Document* pDoc, CPDF_Dictionary* pPage,
- int iMinWidth, FX_DWORD flags);
-void PDF_GetPageText_Unicode(CFX_WideStringArray& lines, CPDF_Document* pDoc, CPDF_Dictionary* pPage,
- int iMinWidth, FX_DWORD flags);
-void PDF_GetTextStream_Unicode(CFX_WideTextBuf& buffer, CPDF_Document* pDoc, CPDF_Dictionary* pPage,
- FX_DWORD flags);
-CFX_WideString PDF_GetFirstTextLine_Unicode(CPDF_Document* pDoc, CPDF_Dictionary* pPage);
-class IPDF_TextPage;
-class IPDF_LinkExtract;
-class IPDF_TextPageFind;
-#define CHAR_ERROR -1
-#define CHAR_NORMAL 0
-#define CHAR_GENERATED 1
-#define CHAR_UNUNICODE 2
-typedef struct {
- FX_WCHAR m_Unicode;
- FX_WCHAR m_Charcode;
- FX_INT32 m_Flag;
- FX_FLOAT m_FontSize;
- FX_FLOAT m_OriginX;
- FX_FLOAT m_OriginY;
- CFX_FloatRect m_CharBox;
- CPDF_TextObject* m_pTextObj;
- CFX_AffineMatrix m_Matrix;
-} FPDF_CHAR_INFO;
-typedef CFX_ArrayTemplate<CFX_FloatRect> CFX_RectArray;
-#define FPDFTEXT_LRTB 0
-#define FPDFTEXT_RLTB 1
-#define FPDFTEXT_TBRL 2
-#define FPDFTEXT_LEFT -1
-#define FPDFTEXT_RIGHT 1
-#define FPDFTEXT_UP -2
-#define FPDFTEXT_DOWN 2
-class IPDF_ReflowedPage;
-#define FPDFTEXT_WRITINGMODE_UNKNOW 0
-#define FPDFTEXT_WRITINGMODE_LRTB 1
-#define FPDFTEXT_WRITINGMODE_RLTB 2
-#define FPDFTEXT_WRITINGMODE_TBRL 3
-class CPDFText_ParseOptions : public CFX_Object
-{
-public:
-
- CPDFText_ParseOptions();
- FX_BOOL m_bGetCharCodeOnly;
- FX_BOOL m_bNormalizeObjs;
- FX_BOOL m_bOutputHyphen;
-};
-class IPDF_TextPage : public CFX_Object
-{
-public:
-
- virtual ~IPDF_TextPage() {}
- static IPDF_TextPage* CreateTextPage(const CPDF_Page* pPage, CPDFText_ParseOptions ParserOptions);
- static IPDF_TextPage* CreateTextPage(const CPDF_Page* pPage, int flags = 0);
- static IPDF_TextPage* CreateTextPage(const CPDF_PageObjects* pObjs, int flags = 0);
- static IPDF_TextPage* CreateReflowTextPage(IPDF_ReflowedPage* pRefPage);
-
- virtual void NormalizeObjects(FX_BOOL bNormalize) = 0;
-
- virtual FX_BOOL ParseTextPage() = 0;
-
-
- virtual FX_BOOL IsParsered() const = 0;
-public:
-
- virtual int CharIndexFromTextIndex(int TextIndex) const = 0;
-
- virtual int TextIndexFromCharIndex(int CharIndex) const = 0;
-
-
- virtual int CountChars() const = 0;
-
- virtual void GetCharInfo(int index, FPDF_CHAR_INFO & info) const = 0;
-
- virtual void GetRectArray(int start, int nCount, CFX_RectArray& rectArray) const = 0;
-
-
-
- virtual int GetIndexAtPos(CPDF_Point point, FX_FLOAT xTorelance, FX_FLOAT yTorelance) const = 0;
-
- virtual int GetIndexAtPos(FX_FLOAT x, FX_FLOAT y, FX_FLOAT xTorelance, FX_FLOAT yTorelance) const = 0;
-
- virtual int GetOrderByDirection(int index, int direction) const = 0;
-
- virtual CFX_WideString GetTextByRect(CFX_FloatRect rect) const = 0;
-
- virtual void GetRectsArrayByRect(CFX_FloatRect rect, CFX_RectArray& resRectArray) const = 0;
-
-
- virtual int CountRects(int start, int nCount) = 0;
-
- virtual void GetRect(int rectIndex, FX_FLOAT& left, FX_FLOAT& top, FX_FLOAT& right, FX_FLOAT &bottom) const = 0;
-
- virtual FX_BOOL GetBaselineRotate(int rectIndex, int& Rotate) = 0;
-
- virtual FX_BOOL GetBaselineRotate(CFX_FloatRect rect, int& Rotate) = 0;
-
- virtual int CountBoundedSegments(FX_FLOAT left, FX_FLOAT top, FX_FLOAT right, FX_FLOAT bottom, FX_BOOL bContains = FALSE) = 0;
-
- virtual void GetBoundedSegment(int index, int& start, int& count) const = 0;
-
-
- virtual int GetWordBreak(int index, int direction) const = 0;
-
- virtual CFX_WideString GetPageText(int start = 0, int nCount = -1 ) const = 0;
-};
-#define FPDFTEXT_MATCHCASE 0x00000001
-#define FPDFTEXT_MATCHWHOLEWORD 0x00000002
-#define FPDFTEXT_CONSECUTIVE 0x00000004
-class IPDF_TextPageFind : public CFX_Object
-{
-public:
-
- virtual ~IPDF_TextPageFind() {}
-
- static IPDF_TextPageFind* CreatePageFind(const IPDF_TextPage* pTextPage);
-public:
-
- virtual FX_BOOL FindFirst(CFX_WideString findwhat, int flags, int startPos = 0) = 0;
-
- virtual FX_BOOL FindNext() = 0;
-
- virtual FX_BOOL FindPrev() = 0;
-
- virtual void GetRectArray(CFX_RectArray& rects) const = 0;
-
- virtual int GetCurOrder() const = 0;
-
- virtual int GetMatchedCount() const = 0;
-};
-class IPDF_LinkExtract : public CFX_Object
-{
-public:
-
- virtual ~IPDF_LinkExtract() {}
-
- static IPDF_LinkExtract* CreateLinkExtract();
-
- virtual FX_BOOL ExtractLinks(const IPDF_TextPage* pTextPage) = 0;
-public:
-
- virtual int CountLinks() const = 0;
-
- virtual CFX_WideString GetURL(int index) const = 0;
-
- virtual void GetBoundedSegment(int index, int& start, int& count) const = 0;
-
- virtual void GetRects(int index, CFX_RectArray& rects) const = 0;
-};
-#endif
+// Copyright 2014 PDFium Authors. All rights reserved. +// Use of this source code is governed by a BSD-style license that can be +// found in the LICENSE file. + +// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com + +#ifndef _FPDF_TEXT_H_ +#define _FPDF_TEXT_H_ +#ifndef _FPDF_PARSER_ +#include "../fpdfapi/fpdf_parser.h" +#endif +#ifndef _FPDF_PAGEOBJ_H_ +#include "../fpdfapi/fpdf_pageobj.h" +#endif +#ifndef _FPDF_PAGE_ +#include "../fpdfapi/fpdf_page.h" +#endif +class CPDF_PageObjects; +#define PDF2TXT_AUTO_ROTATE 1 +#define PDF2TXT_AUTO_WIDTH 2 +#define PDF2TXT_KEEP_COLUMN 4 +#define PDF2TXT_USE_OCR 8 +#define PDF2TXT_INCLUDE_INVISIBLE 16 +void PDF_GetPageText(CFX_ByteStringArray& lines, CPDF_Document* pDoc, CPDF_Dictionary* pPage, + int iMinWidth, FX_DWORD flags); +void PDF_GetPageText_Unicode(CFX_WideStringArray& lines, CPDF_Document* pDoc, CPDF_Dictionary* pPage, + int iMinWidth, FX_DWORD flags); +void PDF_GetTextStream_Unicode(CFX_WideTextBuf& buffer, CPDF_Document* pDoc, CPDF_Dictionary* pPage, + FX_DWORD flags); +CFX_WideString PDF_GetFirstTextLine_Unicode(CPDF_Document* pDoc, CPDF_Dictionary* pPage); +class IPDF_TextPage; +class IPDF_LinkExtract; +class IPDF_TextPageFind; +#define CHAR_ERROR -1 +#define CHAR_NORMAL 0 +#define CHAR_GENERATED 1 +#define CHAR_UNUNICODE 2 +typedef struct { + FX_WCHAR m_Unicode; + FX_WCHAR m_Charcode; + FX_INT32 m_Flag; + FX_FLOAT m_FontSize; + FX_FLOAT m_OriginX; + FX_FLOAT m_OriginY; + CFX_FloatRect m_CharBox; + CPDF_TextObject* m_pTextObj; + CFX_AffineMatrix m_Matrix; +} FPDF_CHAR_INFO; +typedef CFX_ArrayTemplate<CFX_FloatRect> CFX_RectArray; +#define FPDFTEXT_LRTB 0 +#define FPDFTEXT_RLTB 1 +#define FPDFTEXT_TBRL 2 +#define FPDFTEXT_LEFT -1 +#define FPDFTEXT_RIGHT 1 +#define FPDFTEXT_UP -2 +#define FPDFTEXT_DOWN 2 +class IPDF_ReflowedPage; +#define FPDFTEXT_WRITINGMODE_UNKNOW 0 +#define FPDFTEXT_WRITINGMODE_LRTB 1 +#define FPDFTEXT_WRITINGMODE_RLTB 2 +#define FPDFTEXT_WRITINGMODE_TBRL 3 +class CPDFText_ParseOptions : public CFX_Object +{ +public: + + CPDFText_ParseOptions(); + FX_BOOL m_bGetCharCodeOnly; + FX_BOOL m_bNormalizeObjs; + FX_BOOL m_bOutputHyphen; +}; +class IPDF_TextPage : public CFX_Object +{ +public: + + virtual ~IPDF_TextPage() {} + static IPDF_TextPage* CreateTextPage(const CPDF_Page* pPage, CPDFText_ParseOptions ParserOptions); + static IPDF_TextPage* CreateTextPage(const CPDF_Page* pPage, int flags = 0); + static IPDF_TextPage* CreateTextPage(const CPDF_PageObjects* pObjs, int flags = 0); + static IPDF_TextPage* CreateReflowTextPage(IPDF_ReflowedPage* pRefPage); + + virtual void NormalizeObjects(FX_BOOL bNormalize) = 0; + + virtual FX_BOOL ParseTextPage() = 0; + + + virtual FX_BOOL IsParsered() const = 0; +public: + + virtual int CharIndexFromTextIndex(int TextIndex) const = 0; + + virtual int TextIndexFromCharIndex(int CharIndex) const = 0; + + + virtual int CountChars() const = 0; + + virtual void GetCharInfo(int index, FPDF_CHAR_INFO & info) const = 0; + + virtual void GetRectArray(int start, int nCount, CFX_RectArray& rectArray) const = 0; + + + + virtual int GetIndexAtPos(CPDF_Point point, FX_FLOAT xTorelance, FX_FLOAT yTorelance) const = 0; + + virtual int GetIndexAtPos(FX_FLOAT x, FX_FLOAT y, FX_FLOAT xTorelance, FX_FLOAT yTorelance) const = 0; + + virtual int GetOrderByDirection(int index, int direction) const = 0; + + virtual CFX_WideString GetTextByRect(CFX_FloatRect rect) const = 0; + + virtual void GetRectsArrayByRect(CFX_FloatRect rect, CFX_RectArray& resRectArray) const = 0; + + + virtual int CountRects(int start, int nCount) = 0; + + virtual void GetRect(int rectIndex, FX_FLOAT& left, FX_FLOAT& top, FX_FLOAT& right, FX_FLOAT &bottom) const = 0; + + virtual FX_BOOL GetBaselineRotate(int rectIndex, int& Rotate) = 0; + + virtual FX_BOOL GetBaselineRotate(CFX_FloatRect rect, int& Rotate) = 0; + + virtual int CountBoundedSegments(FX_FLOAT left, FX_FLOAT top, FX_FLOAT right, FX_FLOAT bottom, FX_BOOL bContains = FALSE) = 0; + + virtual void GetBoundedSegment(int index, int& start, int& count) const = 0; + + + virtual int GetWordBreak(int index, int direction) const = 0; + + virtual CFX_WideString GetPageText(int start = 0, int nCount = -1 ) const = 0; +}; +#define FPDFTEXT_MATCHCASE 0x00000001 +#define FPDFTEXT_MATCHWHOLEWORD 0x00000002 +#define FPDFTEXT_CONSECUTIVE 0x00000004 +class IPDF_TextPageFind : public CFX_Object +{ +public: + + virtual ~IPDF_TextPageFind() {} + + static IPDF_TextPageFind* CreatePageFind(const IPDF_TextPage* pTextPage); +public: + + virtual FX_BOOL FindFirst(CFX_WideString findwhat, int flags, int startPos = 0) = 0; + + virtual FX_BOOL FindNext() = 0; + + virtual FX_BOOL FindPrev() = 0; + + virtual void GetRectArray(CFX_RectArray& rects) const = 0; + + virtual int GetCurOrder() const = 0; + + virtual int GetMatchedCount() const = 0; +}; +class IPDF_LinkExtract : public CFX_Object +{ +public: + + virtual ~IPDF_LinkExtract() {} + + static IPDF_LinkExtract* CreateLinkExtract(); + + virtual FX_BOOL ExtractLinks(const IPDF_TextPage* pTextPage) = 0; +public: + + virtual int CountLinks() const = 0; + + virtual CFX_WideString GetURL(int index) const = 0; + + virtual void GetBoundedSegment(int index, int& start, int& count) const = 0; + + virtual void GetRects(int index, CFX_RectArray& rects) const = 0; +}; +#endif |