Functions |
| bool | tesseract::TessBaseAPI::AdaptToWordStr (PageSegMode mode, const char *wordstr) |
| int * | tesseract::TessBaseAPI::AllWordConfidences () |
| PageIterator * | tesseract::TessBaseAPI::AnalyseLayout () |
| void | tesseract::TessBaseAPI::Clear () |
| static void | tesseract::TessBaseAPI::DeleteBlockList (BLOCK_LIST *block_list) |
| bool | tesseract::TessBaseAPI::DetectOS (OSResults *) |
| void | tesseract::TessBaseAPI::DumpPGM (const char *filename) |
| void | tesseract::TessBaseAPI::End () |
| BLOCK_LIST * | tesseract::TessBaseAPI::FindLinesCreateBlockList () |
| static ROW * | tesseract::TessBaseAPI::FindRowForBox (BLOCK_LIST *blocks, int left, int top, int right, int bottom) |
| void | tesseract::TessBaseAPI::GetBlockTextOrientations (int **block_orientation, bool **vertical_writing) |
| char * | tesseract::TessBaseAPI::GetBoxText (int page_number) |
| Boxa * | tesseract::TessBaseAPI::GetComponentImages (PageIteratorLevel level, bool text_only, Pixa **pixa, int **blockids) |
| Boxa * | tesseract::TessBaseAPI::GetConnectedComponents (Pixa **cc) |
| CubeRecoContext * | tesseract::TessBaseAPI::GetCubeRecoContext () const |
| const Dawg * | tesseract::TessBaseAPI::GetDawg (int i) const |
| void | tesseract::TessBaseAPI::GetFeaturesForBlob (TBLOB *blob, const DENORM &denorm, INT_FEATURE_ARRAY int_features, int *num_features, int *FeatureOutlineIndex) |
| char * | tesseract::TessBaseAPI::GetHOCRText (int page_number) |
| ResultIterator * | tesseract::TessBaseAPI::GetIterator () |
| MutableIterator * | tesseract::TessBaseAPI::GetMutableIterator () |
| Boxa * | tesseract::TessBaseAPI::GetRegions (Pixa **pixa) |
| Boxa * | tesseract::TessBaseAPI::GetStrips (Pixa **pixa, int **blockids) |
| bool | tesseract::TessBaseAPI::GetTextDirection (int *out_offset, float *out_slope) |
| Boxa * | tesseract::TessBaseAPI::GetTextlines (Pixa **pixa, int **blockids) |
| Pix * | tesseract::TessBaseAPI::GetThresholdedImage () |
| int | tesseract::TessBaseAPI::GetThresholdedImageScaleFactor () const |
| const char * | tesseract::TessBaseAPI::GetUnichar (int unichar_id) |
| char * | tesseract::TessBaseAPI::GetUNLVText () |
| char * | tesseract::TessBaseAPI::GetUTF8Text () |
| Boxa * | tesseract::TessBaseAPI::GetWords (Pixa **pixa) |
| void | tesseract::TessBaseAPI::InitTruthCallback (TruthCallback *cb) |
| int | tesseract::TessBaseAPI::IsValidWord (const char *word) |
| static TBLOB * | tesseract::TessBaseAPI::MakeTBLOB (Pix *pix) |
| static ROW * | tesseract::TessBaseAPI::MakeTessOCRRow (float baseline, float xheight, float descender, float ascender) |
| int | tesseract::TessBaseAPI::MeanTextConf () |
| static void | tesseract::TessBaseAPI::NormalizeTBLOB (TBLOB *tblob, ROW *row, bool numeric_mode, DENORM *denorm) |
| int | tesseract::TessBaseAPI::NumDawgs () const |
| OcrEngineMode const | tesseract::TessBaseAPI::oem () const |
| bool | tesseract::TessBaseAPI::ProcessPage (Pix *pix, int page_index, const char *filename, const char *retry_config, int timeout_millisec, STRING *text_out) |
| bool | tesseract::TessBaseAPI::ProcessPages (const char *filename, const char *retry_config, int timeout_millisec, STRING *text_out) |
| int | tesseract::TessBaseAPI::Recognize (ETEXT_DESC *monitor) |
| int | tesseract::TessBaseAPI::RecognizeForChopTest (ETEXT_DESC *monitor) |
| void | tesseract::TessBaseAPI::RunAdaptiveClassifier (TBLOB *blob, const DENORM &denorm, int num_max_matches, int *unichar_ids, float *ratings, int *num_matches_returned) |
| void | tesseract::TessBaseAPI::set_min_orientation_margin (double margin) |
| void | tesseract::TessBaseAPI::SetDictFunc (DictFunc f) |
| void | tesseract::TessBaseAPI::SetFillLatticeFunc (FillLatticeFunc f) |
| void | tesseract::TessBaseAPI::SetImage (const Pix *pix) |
| void | tesseract::TessBaseAPI::SetImage (const unsigned char *imagedata, int width, int height, int bytes_per_pixel, int bytes_per_line) |
| void | tesseract::TessBaseAPI::SetProbabilityInContextFunc (ProbabilityInContextFunc f) |
| void | tesseract::TessBaseAPI::SetRectangle (int left, int top, int width, int height) |
| void | tesseract::TessBaseAPI::SetSourceResolution (int ppi) |
| void | tesseract::TessBaseAPI::SetThresholder (ImageThresholder *thresholder) |
| Tesseract *const | tesseract::TessBaseAPI::tesseract () const |
The following methods break TesseractRect into pieces, so you can get hold of the thresholded image, get the text in different formats, get bounding boxes, confidences etc.
| PageIterator* tesseract::TessBaseAPI::AnalyseLayout |
( |
|
) |
[inherited] |
Runs page layout analysis in the mode set by SetPageSegMode. May optionally be called prior to Recognize to get access to just the page layout results. Returns an iterator to the results. Returns NULL on error. The returned iterator must be deleted after use. WARNING! This class points to data held within the TessBaseAPI class, and therefore can only be used while the TessBaseAPI class still exists and has not been subjected to a call of Init, SetImage, Recognize, Clear, End, DetectOS, or anything else that changes the internal PAGE_RES.
| Boxa* tesseract::TessBaseAPI::GetComponentImages |
( |
PageIteratorLevel |
level, |
|
|
bool |
text_only, |
|
|
Pixa ** |
pixa, |
|
|
int ** |
blockids | |
|
) |
| | [inherited] |
Get the components of the given level (block, textline, word, etc.) as a leptonica-style Boxa, Pixa pair, in reading order. Can be called before or after Recognize. If blockids is not NULL, the block-id of each component is also returned as an array of one element per component; the caller must delete [] this array after use. If text_only is true, then only text components are returned.
| ResultIterator* tesseract::TessBaseAPI::GetIterator |
( |
|
) |
[inherited] |
Get a reading-order iterator to the results of LayoutAnalysis and/or Recognize. The returned iterator must be deleted after use. WARNING! This class points to data held within the TessBaseAPI class, and therefore can only be used while the TessBaseAPI class still exists and has not been subjected to a call of Init, SetImage, Recognize, Clear, End, DetectOS, or anything else that changes the internal PAGE_RES.
| MutableIterator* tesseract::TessBaseAPI::GetMutableIterator |
( |
|
) |
[inherited] |
Get a mutable iterator to the results of LayoutAnalysis and/or Recognize. The returned iterator must be deleted after use. WARNING! This class points to data held within the TessBaseAPI class, and therefore can only be used while the TessBaseAPI class still exists and has not been subjected to a call of Init, SetImage, Recognize, Clear, End, DetectOS, or anything else that changes the internal PAGE_RES.
| bool tesseract::TessBaseAPI::ProcessPages |
( |
const char * |
filename, |
|
|
const char * |
retry_config, |
|
|
int |
timeout_millisec, |
|
|
STRING * |
text_out | |
|
) |
| | [inherited] |
Recognizes all the pages in the named file, as a multi-page tiff or list of filenames, or single image, and gets the appropriate kind of text according to parameters: tessedit_create_boxfile, tessedit_make_boxes_from_boxes, tessedit_write_unlv, tessedit_create_hocr. Calls ProcessPage on each page in the input file, which may be a multi-page tiff, single-page other file format, or a plain text list of images to read. If tessedit_page_number is non-negative, processing begins at that page of a multi-page tiff file, or filelist. The text is returned in text_out. Returns false on error. If timeout_millisec is non-zero, processing of a single page is terminated after the timeout. If retry_config is non-NULL and non-empty, and some page fails for some reason, the page is reprocessed with the retry_config config file. Useful for interactively debugging a bad page.
| void tesseract::TessBaseAPI::SetImage |
( |
const unsigned char * |
imagedata, |
|
|
int |
width, |
|
|
int |
height, |
|
|
int |
bytes_per_pixel, |
|
|
int |
bytes_per_line | |
|
) |
| | [inherited] |
Provide an image for Tesseract to recognize. Format is as TesseractRect above. Does not copy the image buffer, or take ownership. The source image may be destroyed after Recognize is called, either explicitly or implicitly via one of the Get*Text functions. SetImage clears all recognition results, and sets the rectangle to the full image, so it may be followed immediately by a GetUTF8Text, and it will automatically perform recognition.
| void tesseract::TessBaseAPI::SetThresholder |
( |
ImageThresholder * |
thresholder |
) |
[inline, inherited] |
In extreme cases only, usually with a subclass of Thresholder, it is possible to provide a different Thresholder. The Thresholder may be preloaded with an image, settings etc, or they may be set after. Note that Tesseract takes ownership of the Thresholder and will delete it when it is replaced or the API is destructed.
Definition at line 343 of file baseapi.h.