23 #endif // #ifndef _FX_NO_XFA_ 59 typedef enum _TextCharFlag {
273 typedef enum _TextParseFlags {
287 typedef enum _TextOrderFlag {
521 typedef enum _SearchFlags {
565 #endif // #ifndef _FX_NO_XFA_ 636 bool SetPattern(
const wchar_t* key_words,
bool is_regex_search =
false);
954 #endif // FS_SEARCH_H_ int GetMatchStartCharIndex() const
Get the index of the first character of current match pattern, based on current match page.
common::Range GetCharRange(const RectF &rect)
Get the character index range of all text rectangles within the specified rectangle region.
TextOrderFlag
Enumeration for text order flag which is used when getting text content of a PDF page.
Definition: fs_search.h:287
bool IsEmpty() const
Check whether current object is empty or not.
PageTextLinks(const TextPage &page)
Constructor, from a parsed PDF page.
bool operator==(const TextLink &other) const
Equal operator.
bool operator==(const PageTextLinks &other) const
Equal operator.
If set, match the case of keyword when searching.
Definition: fs_search.h:525
Definition: fs_common.h:1273
TextSearch(const PDFDoc &document, SearchCancelCallback *cancel=0, int flags=foxit::pdf::TextPage::e_ParseTextNormal)
Constructor, for a PDF document.
Definition: fs_search.h:514
RectF char_box
The glyph bounding box in page space.
Definition: fs_search.h:238
CFX_Object Object
Object type.
Definition: fs_basictypes.h:221
bool FindPrev()
Search for previous matched pattern.
TextCharFlag
Enumeration for PDF textpage character flag.
Definition: fs_search.h:59
Character flag: Normal.
Definition: fs_search.h:63
TextPageCharInfo(const common::Font &font, TextCharFlag flag, float font_size, float origin_x, float origin_y, const RectF &char_box, const RectF &char_outbox, const Matrix &matrix)
Constructor, with parameters.
Definition: fs_search.h:90
RectFArray GetTextRectArrayByRect(const RectF &rect)
Get the array of all text rectangles within the specified rectangle region.
TextLink & operator=(const TextLink &other)
Assign operator.
common::Range GetWordAtPos(float x, float y, float tolerance) const
Get the character range of a word at or around a specified position on the page, in PDF coordinate system.
Character flag: Hyphen.
Definition: fs_search.h:69
bool SetStartPage(int page_index)
Set starting page index.
WIDE STRING CLASS.
Definition: fx_string.h:1461
common::Font font
A font for character.
Definition: fs_search.h:208
int GetMatchEndCharIndex() const
Get the index of the last character of current match pattern, based on current match page.
TextLink GetTextLink(int index)
Get a text link object by index.
Character flag: Generated.
Definition: fs_search.h:65
bool IsEmpty() const
Check whether current object is empty or not.
RectF char_outbox
The typographic (display and printing) bounding box in page space.
Definition: fs_search.h:243
Definition: fs_pdfdoc.h:648
bool operator !=(const TextPageCharInfo &char_info) const
Not equal operator.
Definition: fs_search.h:167
If set, match the whole word of keyword when searching.
Definition: fs_search.h:527
bool operator==(const TextSearch &other) const
Equal operator.
TextPageCharInfo(const TextPageCharInfo &char_info)
Constructor, with another character information object.
Definition: fs_search.h:114
RectFArray GetRects()
Get the text rectangles of current text link object.
bool IsEmpty() const
Check whether current object is empty or not.
bool SetStartCharacter(int char_index)
Set starting character index, from where the search process is to be started.
TextParseFlags
Enumeration for parsing flags used for text page.
Definition: fs_search.h:273
Character flag: UnUnicode.
Definition: fs_search.h:67
If set, match the key word consecutively when searching. For example, "CC" will be matched twice in "CCC".
Definition: fs_search.h:529
int GetTextRectCount(int start=0, int count=-1)
Count the text rectangles within a range specified by a start index and count.
bool operator !=(const TextSearch &other) const
Not equal operator.
int GetTextLinkCount()
Get the count of URL-formatted texts in the related PDF page.
~PageTextLinks()
Destructor.
RectF GetTextRect(int rect_index) const
Get the text rectangle by the index.
bool operator !=(const TextLink &other) const
Not equal operator.
bool operator==(const TextPage &other) const
Equal operator.
TextSearch & operator=(const TextSearch &other)
Assign operator.
float font_size
Font size for character.
Definition: fs_search.h:223
Header file for annotation related definitions and classes.
TextCharFlag flag
Flags to indicate which properties of textpage character flag are meaningful.
Definition: fs_search.h:216
virtual bool NeedToCancelNow()=0
A callback function used to check whether to cancel the searching process or not.
WString GetText(TextOrderFlag flag) const
Get the page text.
PageTextLinks & operator=(const PageTextLinks &other)
Assign operator.
int GetCharCount() const
Get the count of all the characters.
Definition: fs_search.h:798
TextPageCharInfo GetCharInfo(int char_index)
Get character information of a specific character.
WString GetURI()
Get URI string.
FX_UINT32 uint32
32-bit unsigned integer.
Definition: fs_basictypes.h:196
Definition: fs_pdfpage.h:412
void * FS_HANDLE
Handle type.
Definition: fs_basictypes.h:214
Header file for common definitions and classes.
int GetMatchPageIndex() const
Get the page index, to which current match belongs.
If this is set, that means to get text content of a PDF page by the display order.
Definition: fs_search.h:291
Parse the text content of a PDF page by normalizing characters based on their positions in the PDF page.
Definition: fs_search.h:275
WString GetTextInRect(const RectF &rect) const
Get the text within a rectangle, in PDF coordinate system.
TextPageCharInfo()
Constructor.
Definition: fs_search.h:103
bool IsEmpty() const
Check whether current object is empty or not.
Definition: fs_search.h:882
Definition: fs_basictypes.h:443
TextLink(const TextLink &other)
Constructor, with another text link object.
Character flag: Unknown.
Definition: fs_search.h:61
Header file for XFA related definitions and functions.
Header file for PDF page related definitions and classes.
bool FindNext()
Search for next matched pattern.
bool SetPattern(const wchar_t *key_words, bool is_regex_search=false)
Set keywords to search.
int GetEndCharIndex()
Get the index of last character of current hyper-link URI, based on PDF page.
Definition: fs_annot.h:994
common::Rotation GetBaselineRotation(int rect_index)
Get the text trend (as rotation) of a specified rectangle.
int GetIndexAtPos(float x, float y, float tolerance) const
Get the character index at or around a specified position on the page, in PDF coordinate system.
Definition: fs_common.h:1428
TextPage & operator=(const TextPage &other)
Assign operator.
Rotation
Enumeration for rotation.
Definition: fs_common.h:57
Foxit namespace.
Definition: fs_pdf3d.h:27
int GetMatchSentenceStartIndex()
Get the index of the first character of current matched pattern, based on the matched sentence.
TextPageCharInfo & operator=(const TextPageCharInfo &char_info)
Assign operator.
Definition: fs_search.h:132
Definition: fs_search.h:52
float origin_y
The y-coordinate of the origin position.
Definition: fs_search.h:233
WString GetTextUnderAnnot(annots::Annot &annot) const
Get the page text which intersects with a specified annotation.
Matrix matrix
The matrix of the character.
Definition: fs_search.h:248
WString GetChars(int start=0, int count=-1) const
Get all the characters within a range specified by a start index and count.
bool operator !=(const TextPage &other) const
Not equal operator.
#define NULL
The null-pointer value.
Definition: fx_system.h:792
No special searching options.
Definition: fs_search.h:523
If set, to ignore full-width characters and treat all characters as standard ASCII or standard-width characters.
Definition: fs_search.h:531
Definition: fx_coordinates.h:1076
WString GetMatchSentence()
Get the sentence that contains current match pattern.
void Set(const common::Font &font, TextCharFlag flag, float font_size, float origin_x, float origin_y, const RectF &char_box, const RectF &char_outbox, const Matrix &matrix)
Set value.
Definition: fs_search.h:193
int GetMatchSentenceEndIndex()
Get the index of the last character of current matched pattern, based on the matched sentence.
Parse the text content of a PDF page by the stream order.
Definition: fs_search.h:279
bool operator==(const TextPageCharInfo &char_info) const
Equal operator.
Definition: fs_search.h:151
SearchFlags
Enumeration for searching flags.
Definition: fs_search.h:521
TextPage(const PDFPage &page, int flags=foxit::pdf::TextPage::e_ParseTextNormal)
Constructor, from a parsed PDF page.
bool operator !=(const PageTextLinks &other) const
Not equal operator.
Definition: fs_search.h:266
Definition: fs_search.h:39
If this is set, that means to get text content of a PDF page by the stream order.
Definition: fs_search.h:289
Character flag: ComboWord.
Definition: fs_search.h:71
bool SetEndPage(int page_index)
Set ending page index.
bool SetSearchFlags(uint32 search_flags)
Set search flags.
Definition: fx_coordinates.h:771
RectFArray GetMatchRects() const
Get the rectangles of current match pattern.
int GetStartCharIndex()
Get the index of start character of current hyper-link URI, based on PDF page.
Parse the text content of a PDF page with outputting the hyphen on a line feed.
Definition: fs_search.h:277
float origin_x
The x-coordinate of the origin position.
Definition: fs_search.h:228