|
#include <TextExtractor.h>
Public Member Functions | ||||
| int | GetNumGlyphs () | |||
| ||||
| void | GetBBox (double out_bbox[4]) | |||
| ||||
| void | GetQuad (double out_quad[8]) | |||
| ||||
| void | GetGlyphQuad (int glyph_idx, double out_quad[8]) | |||
| ||||
| Style | GetCharStyle (int char_idx) | |||
| ||||
| Style | GetStyle () | |||
| ||||
| int | GetStringLen () | |||
| ||||
| const Unicode * | GetString () | |||
| ||||
| Word | GetNextWord () | |||
| ||||
| int | GetCurrentNum () | |||
| ||||
| bool | IsValid () | |||
| ||||
| bool | operator== (const Word &) | |||
| bool | operator!= (const Word &) | |||
| Word () | ||||
Each word contains a sequence of characters in one or more styles (see TextExtractor::Style).
| pdftron::PDF::TextExtractor::Word::Word | ( | ) |
| int pdftron::PDF::TextExtractor::Word::GetNumGlyphs | ( | ) |
| void pdftron::PDF::TextExtractor::Word::GetBBox | ( | double | out_bbox[4] | ) |
| out_bbox | The bounding box for this word (in unrotated page coordinates). |
| void pdftron::PDF::TextExtractor::Word::GetQuad | ( | double | out_quad[8] | ) |
| out_quad | The quadrilateral representing a tight bounding box for this word (in unrotated page coordinates). |
| void pdftron::PDF::TextExtractor::Word::GetGlyphQuad | ( | int | glyph_idx, | double | out_quad[8] | ) |
| glyph_idx | The index of a glyph in this word. |
| out_quad | The quadrilateral representing a tight bounding box for a given glyph in the word (in unrotated page coordinates). |
| Style pdftron::PDF::TextExtractor::Word::GetCharStyle | ( | int | char_idx | ) |
| char_idx | The index of a character in this word. |
| Style pdftron::PDF::TextExtractor::Word::GetStyle | ( | ) |
| int pdftron::PDF::TextExtractor::Word::GetStringLen | ( | ) |
| const Unicode* pdftron::PDF::TextExtractor::Word::GetString | ( | ) |
| Word pdftron::PDF::TextExtractor::Word::GetNextWord | ( | ) |
| int pdftron::PDF::TextExtractor::Word::GetCurrentNum | ( | ) |
GetCurrentNum() returns 0 for a word that starts the line, and (line.GetNumWords()-1) for the last word in the line.
| bool pdftron::PDF::TextExtractor::Word::IsValid | ( | ) |
| bool pdftron::PDF::TextExtractor::Word::operator== | ( | const Word & | ) |
| bool pdftron::PDF::TextExtractor::Word::operator!= | ( | const Word & | ) |