/* Handle type for a document text finder: a pointer to
 * struct _t_PDDocTextFinder, whose definition is not shown here. */
typedef struct _t_PDDocTextFinder *PDDocTextFinder;
| |
A pointer to an array that holds the matches.
| |
The number of matches in the matches array.
| |
|
| |
Page number where quad is located
| |
Matched phrase bounding quad
| |
|
| |
char * phrase ; | The matched phrase.
|
The length of the matched phrase.
| |
A pointer to an array that holds the match's quad information.
| |
The number of quads in the quad array.
| |
|
Finds all regular expression (regex) matches for the given page range.
Only words within or partially within the page's crop box (see PDPageGetCropBox()) are included. Words outside the crop box are skipped.
There can be only one match list in existence at a time; clients must release the previous match list, using PDDocTextFinderReleaseMatchList(), before creating a new one.
Available only on Windows, Mac, and Linux platforms
/**
 * Finds all regular expression (regex) matches for the given page range.
 *
 * Only one match list can exist at a time: release the previous one with
 * PDDocTextFinderReleaseMatchList() before acquiring a new one.
 *
 * @param mObj            The document text finder used to acquire the match list.
 * @param pdDoc           The document to search for matches.
 * @param beginPageNumber The page number at which the search begins; the first
 *                        page is 0. Pass PDAllPages to process all pages.
 * @param endPageNumber   The end page number of the search; ignored when
 *                        beginPageNumber is PDAllPages.
 * @param regexstr        The regular expression to use for the search.
 * @return The match list for the searched pages.
 */
PDDocTextFinderMatchList PDDocTextFinderAcquireMatchList(PDDocTextFinder mObj,
                                                         PDDoc pdDoc,
                                                         ASInt32 beginPageNumber,
                                                         ASInt32 endPageNumber,
                                                         const char *regexstr);
mObj | IN (Required) The document text finder used to acquire the match list.
|
pdDoc | IN (Required) The document to search for matches.
|
beginPageNumber | IN (Required) The beginning page number from which to search. The first page is 0, not 1 as designated in Acrobat. Pass PDAllPages (see PDExpT.h) to sequentially process all pages in the document. |
endPageNumber | IN (Required) The page number at which the search ends. If beginPageNumber is set to PDAllPages, this parameter is ignored.
|
regexstr | IN (Required) The regular expression to use for the search.
|
/**
 * Takes a word finder configuration and returns a PDDocTextFinder handle.
 *
 * @param wfConfig The word finder configuration to be used to extract the words.
 */
PDDocTextFinder PDDocTextFinderCreate(PDWordFinderConfig wfConfig);
wfConfig | IN (Required) The word finder configuration to be used to extract the words.
|
/**
 * Takes a word finder configuration plus a document text finder
 * configuration and returns a PDDocTextFinder handle.
 *
 * @param wfConfig  The word finder configuration to be used to extract the words.
 * @param dtfConfig The document text finder configuration to be used to
 *                  configure the extracted text.
 */
PDDocTextFinder PDDocTextFinderCreateEx(PDWordFinderConfig wfConfig,
                                        PDDocTextFinderConfig dtfConfig);
wfConfig | IN (Required) The word finder configuration to be used to extract the words.
|
dtfConfig | IN (Required) The document text finder configuration to be used to configure the extracted text.
|
/**
 * Destroys a document text finder.
 *
 * @param mObj The document text finder to destroy.
 */
void PDDocTextFinderDestroy(PDDocTextFinder mObj);
mObj | IN (Required) The document text finder to destroy.
|
/**
 * Releases the match list previously acquired with
 * PDDocTextFinderAcquireMatchList(). Only one match list can exist at a
 * time, so call this before acquiring a new one.
 *
 * @param mObj A document text finder object.
 */
void PDDocTextFinderReleaseMatchList(PDDocTextFinder mObj);
mObj | IN (Required) A document text finder object.
|