- char * sort_key; // standard C string '\0' terminated
- char * norm_term; // standard C utf-8 string
- char * disp_term; // standard C utf-8 string
+ // type and action object
+ enum icu_chain_step_type type;
+ union {
+ struct icu_casemap * casemap;
+ struct icu_normalizer * normalizer;
+ struct icu_tokenizer * tokenizer;
+ } u;
+ // temprary post-action utf16 buffer
+ struct icu_buf_utf16 * buf16;
+ struct icu_chain_step * previous;
+ int more_tokens;
+ int need_new_token;
+};
+
+
+struct icu_chain;
+
+struct icu_chain_step * icu_chain_step_create(struct icu_chain * chain,
+ enum icu_chain_step_type type,
+ const uint8_t * rule,
+ struct icu_buf_utf16 * buf16,
+ UErrorCode *status);
+
+
+void icu_chain_step_destroy(struct icu_chain_step * step);
+
+
+struct icu_chain
+{
+ uint8_t identifier[128];
+ uint8_t locale[16];
+
+ // number of tokens returned so far
+ int32_t token_count;
+
+ // utf8 output buffers
+ struct icu_buf_utf8 * display8;
+ struct icu_buf_utf8 * norm8;
+ struct icu_buf_utf8 * sort8;
+
+ // utf16 source buffer
+ struct icu_buf_utf16 * src16;
+
+ // linked list of chain steps
+ struct icu_chain_step * steps;