summaryrefslogtreecommitdiff
path: root/public/fpdf_text.h
diff options
context:
space:
mode:
Diffstat (limited to 'public/fpdf_text.h')
-rw-r--r--public/fpdf_text.h265
1 files changed, 181 insertions, 84 deletions
diff --git a/public/fpdf_text.h b/public/fpdf_text.h
index 3c0afd2498..3046bb0f85 100644
--- a/public/fpdf_text.h
+++ b/public/fpdf_text.h
@@ -17,21 +17,26 @@ extern "C" {
// Function: FPDFText_LoadPage
// Prepare information about all characters in a page.
// Parameters:
-// page - Handle to the page. Returned by FPDF_LoadPage function (in FPDFVIEW module).
+// page - Handle to the page. Returned by FPDF_LoadPage function
+// (in FPDFVIEW module).
// Return value:
// A handle to the text page information structure.
// NULL if something goes wrong.
// Comments:
-// Application must call FPDFText_ClosePage to release the text page information.
+// Application must call FPDFText_ClosePage to release the text page
+// information.
// Notes:
-// The method can not support to load out FPDF_TEXTPAGE for the document consists of dynamic fields.
+// The method can not support to load out FPDF_TEXTPAGE for the
+// document consists of dynamic fields.
//
DLLEXPORT FPDF_TEXTPAGE STDCALL FPDFText_LoadPage(FPDF_PAGE page);
// Function: FPDFText_ClosePage
-// Release all resources allocated for a text page information structure.
+// Release all resources allocated for a text page information
+// structure.
// Parameters:
-// text_page - Handle to a text page information structure. Returned by FPDFText_LoadPage function.
+// text_page - Handle to a text page information structure.
+// Returned by FPDFText_LoadPage function.
// Return Value:
// None.
//
@@ -40,13 +45,17 @@ DLLEXPORT void STDCALL FPDFText_ClosePage(FPDF_TEXTPAGE text_page);
// Function: FPDFText_CountChars
// Get number of characters in a page.
// Parameters:
-// text_page - Handle to a text page information structure. Returned by FPDFText_LoadPage function.
+// text_page - Handle to a text page information structure.
+// Returned by FPDFText_LoadPage function.
// Return value:
// Number of characters in the page. Return -1 for error.
-// Generated characters, like additional space characters, new line characters, are also counted.
+// Generated characters, like additional space characters, new line
+// characters, are also counted.
// Comments:
-// Characters in a page form a "stream", inside the stream, each character has an index.
-// We will use the index parameters in many of FPDFTEXT functions. The first character in the page
+// Characters in a page form a "stream", inside the stream, each
+// character has an index.
+// We will use the index parameters in many of FPDFTEXT functions. The
+// first character in the page
// has an index value of zero.
//
DLLEXPORT int STDCALL FPDFText_CountChars(FPDF_TEXTPAGE text_page);
@@ -54,149 +63,213 @@ DLLEXPORT int STDCALL FPDFText_CountChars(FPDF_TEXTPAGE text_page);
// Function: FPDFText_GetUnicode
// Get Unicode of a character in a page.
// Parameters:
-// text_page - Handle to a text page information structure. Returned by FPDFText_LoadPage function.
+// text_page - Handle to a text page information structure.
+// Returned by FPDFText_LoadPage function.
// index - Zero-based index of the character.
// Return value:
// The Unicode of the particular character.
-// If a character is not encoded in Unicode and Foxit engine can't convert to Unicode,
+// If a character is not encoded in Unicode and Foxit engine can't
+// convert to Unicode,
// the return value will be zero.
//
-DLLEXPORT unsigned int STDCALL FPDFText_GetUnicode(FPDF_TEXTPAGE text_page, int index);
+DLLEXPORT unsigned int STDCALL FPDFText_GetUnicode(FPDF_TEXTPAGE text_page,
+ int index);
// Function: FPDFText_GetFontSize
// Get the font size of a particular character.
// Parameters:
-// text_page - Handle to a text page information structure. Returned by FPDFText_LoadPage function.
+// text_page - Handle to a text page information structure.
+// Returned by FPDFText_LoadPage function.
// index - Zero-based index of the character.
// Return value:
-// The font size of the particular character, measured in points (about 1/72 inch).
+// The font size of the particular character, measured in points (about
+// 1/72 inch).
// This is the typographic size of the font (so called "em size").
//
-DLLEXPORT double STDCALL FPDFText_GetFontSize(FPDF_TEXTPAGE text_page, int index);
+DLLEXPORT double STDCALL FPDFText_GetFontSize(FPDF_TEXTPAGE text_page,
+ int index);
// Function: FPDFText_GetCharBox
// Get bounding box of a particular character.
// Parameters:
-// text_page - Handle to a text page information structure. Returned by FPDFText_LoadPage function.
+// text_page - Handle to a text page information structure.
+// Returned by FPDFText_LoadPage function.
// index - Zero-based index of the character.
-// left - Pointer to a double number receiving left position of the character box.
-// right - Pointer to a double number receiving right position of the character box.
-// bottom - Pointer to a double number receiving bottom position of the character box.
-// top - Pointer to a double number receiving top position of the character box.
+// left - Pointer to a double number receiving left position
+// of the character box.
+// right - Pointer to a double number receiving right position
+// of the character box.
+// bottom - Pointer to a double number receiving bottom position
+// of the character box.
+// top - Pointer to a double number receiving top position of
+// the character box.
// Return Value:
// None.
// Comments:
// All positions are measured in PDF "user space".
//
-DLLEXPORT void STDCALL FPDFText_GetCharBox(FPDF_TEXTPAGE text_page, int index, double* left,
- double* right, double* bottom, double* top);
+DLLEXPORT void STDCALL FPDFText_GetCharBox(FPDF_TEXTPAGE text_page,
+ int index,
+ double* left,
+ double* right,
+ double* bottom,
+ double* top);
// Function: FPDFText_GetCharIndexAtPos
-// Get the index of a character at or nearby a certain position on the page.
+// Get the index of a character at or nearby a certain position on the
+// page.
// Parameters:
-// text_page - Handle to a text page information structure. Returned by FPDFText_LoadPage function.
+// text_page - Handle to a text page information structure.
+// Returned by FPDFText_LoadPage function.
// x - X position in PDF "user space".
// y - Y position in PDF "user space".
-// xTolerance - An x-axis tolerance value for character hit detection, in point unit.
-// yTolerance - A y-axis tolerance value for character hit detection, in point unit.
+// xTolerance - An x-axis tolerance value for character hit
+// detection, in point unit.
+// yTolerance - A y-axis tolerance value for character hit
+// detection, in point unit.
// Return Value:
// The zero-based index of the character at, or nearby the point (x,y).
-// If there is no character at or nearby the point, return value will be -1.
+// If there is no character at or nearby the point, return value will
+// be -1.
// If an error occurs, -3 will be returned.
//
DLLEXPORT int STDCALL FPDFText_GetCharIndexAtPos(FPDF_TEXTPAGE text_page,
- double x, double y, double xTorelance, double yTolerance);
+ double x,
+ double y,
+ double xTorelance,
+ double yTolerance);
// Function: FPDFText_GetText
// Extract unicode text string from the page.
// Parameters:
-// text_page - Handle to a text page information structure. Returned by FPDFText_LoadPage function.
+// text_page - Handle to a text page information structure.
+// Returned by FPDFText_LoadPage function.
// start_index - Index for the start characters.
// count - Number of characters to be extracted.
-// result - A buffer (allocated by application) receiving the extracted unicodes.
-// The size of the buffer must be able to hold the number of characters plus a terminator.
+// result - A buffer (allocated by application) receiving the
+// extracted unicodes.
+// The size of the buffer must be able to hold the
+// number of characters plus a terminator.
// Return Value:
-// Number of characters written into the result buffer, including the trailing terminator.
+// Number of characters written into the result buffer, including the
+// trailing terminator.
// Comments:
// This function ignores characters without unicode information.
//
-DLLEXPORT int STDCALL FPDFText_GetText(FPDF_TEXTPAGE text_page, int start_index, int count, unsigned short* result);
+DLLEXPORT int STDCALL FPDFText_GetText(FPDF_TEXTPAGE text_page,
+ int start_index,
+ int count,
+ unsigned short* result);
// Function: FPDFText_CountRects
// Count number of rectangular areas occupied by a segment of texts.
// Parameters:
-// text_page - Handle to a text page information structure. Returned by FPDFText_LoadPage function.
+// text_page - Handle to a text page information structure.
+// Returned by FPDFText_LoadPage function.
// start_index - Index for the start characters.
// count - Number of characters.
// Return value:
// Number of rectangles. Zero for error.
// Comments:
-// This function, along with FPDFText_GetRect can be used by applications to detect the position
-// on the page for a text segment, so proper areas can be highlighted or something.
-// FPDFTEXT will automatically merge small character boxes into bigger one if those characters
+// This function, along with FPDFText_GetRect can be used by
+// applications to detect the position
+// on the page for a text segment, so proper areas can be highlighted
+// or something.
+// FPDFTEXT will automatically merge small character boxes into bigger
+// one if those characters
// are on the same line and use same font settings.
//
-DLLEXPORT int STDCALL FPDFText_CountRects(FPDF_TEXTPAGE text_page, int start_index, int count);
+DLLEXPORT int STDCALL FPDFText_CountRects(FPDF_TEXTPAGE text_page,
+ int start_index,
+ int count);
// Function: FPDFText_GetRect
-// Get a rectangular area from the result generated by FPDFText_CountRects.
+// Get a rectangular area from the result generated by
+// FPDFText_CountRects.
// Parameters:
-// text_page - Handle to a text page information structure. Returned by FPDFText_LoadPage function.
+// text_page - Handle to a text page information structure.
+// Returned by FPDFText_LoadPage function.
// rect_index - Zero-based index for the rectangle.
-// left - Pointer to a double value receiving the rectangle left boundary.
-// top - Pointer to a double value receiving the rectangle top boundary.
-// right - Pointer to a double value receiving the rectangle right boundary.
-// bottom - Pointer to a double value receiving the rectangle bottom boundary.
+// left - Pointer to a double value receiving the rectangle
+// left boundary.
+// top - Pointer to a double value receiving the rectangle
+// top boundary.
+// right - Pointer to a double value receiving the rectangle
+// right boundary.
+// bottom - Pointer to a double value receiving the rectangle
+// bottom boundary.
// Return Value:
// None.
//
-DLLEXPORT void STDCALL FPDFText_GetRect(FPDF_TEXTPAGE text_page, int rect_index, double* left, double* top,
- double* right, double* bottom);
+DLLEXPORT void STDCALL FPDFText_GetRect(FPDF_TEXTPAGE text_page,
+ int rect_index,
+ double* left,
+ double* top,
+ double* right,
+ double* bottom);
// Function: FPDFText_GetBoundedText
// Extract unicode text within a rectangular boundary on the page.
// Parameters:
-// text_page - Handle to a text page information structure. Returned by FPDFText_LoadPage function.
+// text_page - Handle to a text page information structure.
+// Returned by FPDFText_LoadPage function.
// left - Left boundary.
// top - Top boundary.
// right - Right boundary.
// bottom - Bottom boundary.
// buffer - A unicode buffer.
-// buflen - Number of characters (not bytes) for the buffer, excluding an additional terminator.
+// buflen - Number of characters (not bytes) for the buffer,
+// excluding an additional terminator.
// Return Value:
-// If buffer is NULL or buflen is zero, return number of characters (not bytes) of text present within
-// the rectangle, excluding a terminating NUL. Generally you should pass a buffer at least one larger
-// than this if you want a terminating NUL, which will be provided if space is available.
-// Otherwise, return number of characters copied into the buffer, including the terminating NUL
+// If buffer is NULL or buflen is zero, return number of characters
+// (not bytes) of text present within
+// the rectangle, excluding a terminating NUL. Generally you should
+// pass a buffer at least one larger
+// than this if you want a terminating NUL, which will be provided if
+// space is available.
+// Otherwise, return number of characters copied into the buffer,
+// including the terminating NUL
// when space for it is available.
// Comment:
-// If the buffer is too small, as much text as will fit is copied into it.
+// If the buffer is too small, as much text as will fit is copied into
+// it.
//
-DLLEXPORT int STDCALL FPDFText_GetBoundedText(FPDF_TEXTPAGE text_page,double left, double top,
- double right, double bottom,unsigned short* buffer,int buflen);
-
+DLLEXPORT int STDCALL FPDFText_GetBoundedText(FPDF_TEXTPAGE text_page,
+ double left,
+ double top,
+ double right,
+ double bottom,
+ unsigned short* buffer,
+ int buflen);
// Flags used by FPDFText_FindStart function.
-#define FPDF_MATCHCASE 0x00000001 //If not set, it will not match case by default.
-#define FPDF_MATCHWHOLEWORD 0x00000002 //If not set, it will not match the whole word by default.
+#define FPDF_MATCHCASE \
+ 0x00000001 // If not set, it will not match case by default.
+#define FPDF_MATCHWHOLEWORD \
+ 0x00000002 // If not set, it will not match the whole word by default.
// Function: FPDFText_FindStart
// Start a search.
// Parameters:
-// text_page - Handle to a text page information structure. Returned by FPDFText_LoadPage function.
+// text_page - Handle to a text page information structure.
+// Returned by FPDFText_LoadPage function.
// findwhat - A unicode match pattern.
// flags - Option flags.
// start_index - Start from this character. -1 for end of the page.
// Return Value:
-// A handle for the search context. FPDFText_FindClose must be called to release this handle.
+// A handle for the search context. FPDFText_FindClose must be called
+// to release this handle.
//
-DLLEXPORT FPDF_SCHHANDLE STDCALL FPDFText_FindStart(FPDF_TEXTPAGE text_page, FPDF_WIDESTRING findwhat,
- unsigned long flags, int start_index);
+DLLEXPORT FPDF_SCHHANDLE STDCALL FPDFText_FindStart(FPDF_TEXTPAGE text_page,
+ FPDF_WIDESTRING findwhat,
+ unsigned long flags,
+ int start_index);
// Function: FPDFText_FindNext
// Search in the direction from page start to end.
// Parameters:
-// handle - A search context handle returned by FPDFText_FindStart.
+// handle - A search context handle returned by
+// FPDFText_FindStart.
// Return Value:
// Whether a match is found.
//
@@ -205,7 +278,8 @@ DLLEXPORT FPDF_BOOL STDCALL FPDFText_FindNext(FPDF_SCHHANDLE handle);
// Function: FPDFText_FindPrev
// Search in the direction from page end to start.
// Parameters:
-// handle - A search context handle returned by FPDFText_FindStart.
+// handle - A search context handle returned by
+// FPDFText_FindStart.
// Return Value:
// Whether a match is found.
//
@@ -214,7 +288,8 @@ DLLEXPORT FPDF_BOOL STDCALL FPDFText_FindPrev(FPDF_SCHHANDLE handle);
// Function: FPDFText_GetSchResultIndex
// Get the starting character index of the search result.
// Parameters:
-// handle - A search context handle returned by FPDFText_FindStart.
+// handle - A search context handle returned by
+// FPDFText_FindStart.
// Return Value:
// Index for the starting character.
//
@@ -223,7 +298,8 @@ DLLEXPORT int STDCALL FPDFText_GetSchResultIndex(FPDF_SCHHANDLE handle);
// Function: FPDFText_GetSchCount
// Get the number of matched characters in the search result.
// Parameters:
-// handle - A search context handle returned by FPDFText_FindStart.
+// handle - A search context handle returned by
+// FPDFText_FindStart.
// Return Value:
// Number of matched characters.
//
@@ -232,7 +308,8 @@ DLLEXPORT int STDCALL FPDFText_GetSchCount(FPDF_SCHHANDLE handle);
// Function: FPDFText_FindClose
// Release a search context.
// Parameters:
-// handle - A search context handle returned by FPDFText_FindStart.
+// handle - A search context handle returned by
+// FPDFText_FindStart.
// Return Value:
// None.
//
@@ -241,16 +318,22 @@ DLLEXPORT void STDCALL FPDFText_FindClose(FPDF_SCHHANDLE handle);
// Function: FPDFLink_LoadWebLinks
// Prepare information about weblinks in a page.
// Parameters:
-// text_page - Handle to a text page information structure. Returned by FPDFText_LoadPage function.
+// text_page - Handle to a text page information structure.
+// Returned by FPDFText_LoadPage function.
// Return Value:
// A handle to the page's links information structure.
// NULL if something goes wrong.
// Comments:
-// Weblinks are those links implicitly embedded in PDF pages. PDF also has a type of
-// annotation called "link", FPDFTEXT doesn't deal with that kind of link.
-// FPDFTEXT weblink feature is useful for automatically detecting links in the page
-// contents. For example, things like "http://www.foxitsoftware.com" will be detected,
-// so applications can allow user to click on those characters to activate the link,
+// Weblinks are those links implicitly embedded in PDF pages. PDF also
+// has a type of
+// annotation called "link", FPDFTEXT doesn't deal with that kind of
+// link.
+// FPDFTEXT weblink feature is useful for automatically detecting links
+// in the page
+// contents. For example, things like "http://www.foxitsoftware.com"
+// will be detected,
+// so applications can allow user to click on those characters to
+// activate the link,
// even the PDF doesn't come with link annotations.
//
// FPDFLink_CloseWebLinks must be called to release resources.
@@ -272,12 +355,17 @@ DLLEXPORT int STDCALL FPDFLink_CountWebLinks(FPDF_PAGELINK link_page);
// link_page - Handle returned by FPDFLink_LoadWebLinks.
// link_index - Zero-based index for the link.
// buffer - A unicode buffer.
-// buflen - Number of characters (not bytes) for the buffer, including an additional terminator.
+// buflen - Number of characters (not bytes) for the buffer,
+// including an additional terminator.
// Return Value:
-// If buffer is NULL or buflen is zero, return number of characters (not bytes and an additional terminator is also counted) needed,
+// If buffer is NULL or buflen is zero, return number of characters
+// (not bytes and an additional terminator is also counted) needed,
// otherwise, return number of characters copied into the buffer.
//
-DLLEXPORT int STDCALL FPDFLink_GetURL(FPDF_PAGELINK link_page, int link_index, unsigned short* buffer,int buflen);
+DLLEXPORT int STDCALL FPDFLink_GetURL(FPDF_PAGELINK link_page,
+ int link_index,
+ unsigned short* buffer,
+ int buflen);
// Function: FPDFLink_CountRects
// Count number of rectangular areas for the link.
@@ -287,7 +375,8 @@ DLLEXPORT int STDCALL FPDFLink_GetURL(FPDF_PAGELINK link_page, int link_index, u
// Return Value:
// Number of rectangular areas for the link.
//
-DLLEXPORT int STDCALL FPDFLink_CountRects(FPDF_PAGELINK link_page, int link_index);
+DLLEXPORT int STDCALL FPDFLink_CountRects(FPDF_PAGELINK link_page,
+ int link_index);
// Function: FPDFLink_GetRect
// Fetch the boundaries of a rectangle for a link.
@@ -295,15 +384,24 @@ DLLEXPORT int STDCALL FPDFLink_CountRects(FPDF_PAGELINK link_page, int link_inde
// link_page - Handle returned by FPDFLink_LoadWebLinks.
// link_index - Zero-based index for the link.
// rect_index - Zero-based index for a rectangle.
-// left - Pointer to a double value receiving the rectangle left boundary.
-// top - Pointer to a double value receiving the rectangle top boundary.
-// right - Pointer to a double value receiving the rectangle right boundary.
-// bottom - Pointer to a double value receiving the rectangle bottom boundary.
+// left - Pointer to a double value receiving the rectangle
+// left boundary.
+// top - Pointer to a double value receiving the rectangle
+// top boundary.
+// right - Pointer to a double value receiving the rectangle
+// right boundary.
+// bottom - Pointer to a double value receiving the rectangle
+// bottom boundary.
// Return Value:
// None.
//
-DLLEXPORT void STDCALL FPDFLink_GetRect(FPDF_PAGELINK link_page, int link_index, int rect_index,
- double* left, double* top,double* right, double* bottom);
+DLLEXPORT void STDCALL FPDFLink_GetRect(FPDF_PAGELINK link_page,
+ int link_index,
+ int rect_index,
+ double* left,
+ double* top,
+ double* right,
+ double* bottom);
// Function: FPDFLink_CloseWebLinks
// Release resources used by weblink feature.
@@ -314,7 +412,6 @@ DLLEXPORT void STDCALL FPDFLink_GetRect(FPDF_PAGELINK link_page, int link_index,
//
DLLEXPORT void STDCALL FPDFLink_CloseWebLinks(FPDF_PAGELINK link_page);
-
#ifdef __cplusplus
}
#endif