(token module).
More...
Data Structures | |
struct | Token |
Token. More... | |
struct | Tokenization |
Tokenization. More... | |
Typedefs | |
typedef GSList | TokenList |
List of tokens. | |
Functions | |
Tokenization | tokenize (const char *text, const gboolean text_follows, int(*is_delimiter)(int), int(*is_never_delimiter)(int), int(*is_glueable)(int)) |
void | tokenizationFree (Tokenization *tokenization) |
void | tokenizationDump (Tokenization *tokenization, const char *delimiter, int(*print)(const char *,...)) |
void | tokenDump (const Token *token, const char *delimiter, int(*print)(const char *,...)) |
gboolean | tokenMerge (TokenList *token_list1, TokenList *token_list2) |
void | tokenGetString (const Token *token, GString *output) |
(token module).
SlpTK Library 0.6.0
<token.h>
Antonin Merçay (revision on 15.12.2004)
void tokenDump | ( | const Token * | token, | |
const char * | delimiter, | |||
int(*)(const char *,...) | print | |||
) |
Dump a token
[in] | token | The token to dump |
[in] | delimiter | The string to dump at the end of the token |
[in] | print | The printing function used to dump |
Affiche_Token
void tokenGetString | ( | const Token * | token, | |
GString * | output | |||
) |
Convert a token into its string representation
token | The token to convert | |
output | The string where to output |
Token2String
void tokenizationDump | ( | Tokenization * | tokenization, | |
const char * | delimiter, | |||
int(*)(const char *,...) | print | |||
) |
Dump a tokenization
[in] | tokenization | The tokenization to dump |
[in] | delimiter | The string to dump at the end of each token |
[in] | print | The printing function used to dump |
Affiche_Tokenisation
void tokenizationFree | ( | Tokenization * | tokenization | ) |
Free the memory allocated to a tokenization
[in] | tokenization | The tokenization to free |
Libere_Tokenisation
Tokenization tokenize | ( | const char * | text, | |
const gboolean | text_follows, | |||
int(*)(int) | is_delimiter, | |||
int(*)(int) | is_never_delimiter, | |||
int(*)(int) | is_glueable | |||
) |
Tokenize an input string using the given character classification routines.
[in] | text | The input string to tokenize |
[in] | text_follows | A flag indicating whether more text, continuing the current input, may follow. If text_follows is set and the tokenization of text ends in the middle of a word, the last token is ignored because it may be completed by the next call. |
[in] | is_delimiter | The routine recognizing the delimiter characters |
[in] | is_never_delimiter | The routine recognizing the characters that are never delimiters |
[in] | is_glueable | The routine recognizing the glueable characters |
Tokenise
gboolean tokenMerge | ( | TokenList * | token_list1, | |
TokenList * | token_list2 | |||
) |
Merge two tokens
token_list1 | The token list element of the first token to merge | |
token_list2 | The token list element of the second token to merge |
Whether the tokens were merged (TRUE) or not (FALSE, i.e. the tokens are not joinable)
Join_Token