diff options
author | Roberto C. Sanchez <roberto@connexer.com> | 2014-03-29 10:53:49 -0400 |
---|---|---|
committer | Roberto C. Sanchez <roberto@connexer.com> | 2014-03-29 10:53:49 -0400 |
commit | 8c8aa6b07e595cfac56838b5964ab3e96051f1b2 (patch) | |
tree | da38e2c1979148dbd3b0c7b87f930746f5ba7f44 /include/utf8transliterator.h | |
parent | 8d3fc864d094eeadc721f8e93436b37a5fab173e (diff) |
Imported Upstream version 1.5.7
Diffstat (limited to 'include/utf8transliterator.h')
-rw-r--r-- | include/utf8transliterator.h | 93 |
1 files changed, 53 insertions, 40 deletions
diff --git a/include/utf8transliterator.h b/include/utf8transliterator.h index b28d699..0956118 100644 --- a/include/utf8transliterator.h +++ b/include/utf8transliterator.h @@ -1,4 +1,6 @@ -/* +/****************************************************************************** + * + * $Id: utf8transliterator.h,v 1.22 2003/10/05 19:07:35 mgruner Exp $ * * Copyright 2001 CrossWire Bible Society (http://www.crosswire.org) * CrossWire Bible Society @@ -15,59 +17,70 @@ * General Public License for more details. * */ -#ifdef _ICU_ #ifndef UTF8TRANSLITERATOR_H #define UTF8TRANSLITERATOR_H -enum scriptEnum {SE_OFF, SE_LATIN, /*one-way (to) transliterators*/ SE_BASICLATIN, SE_BETA, SE_BGREEK, /*two-way transliterators*/ SE_GREEK, SE_HEBREW, SE_CYRILLIC, SE_ARABIC, SE_SYRIAC, SE_KATAKANA, SE_HIRAGANA, SE_JAMO, SE_HANGUL, SE_DEVANAGARI, SE_TAMIL, SE_BENGALI, SE_GURMUKHI, SE_GUJARATI, SE_ORIYA, SE_TELUGU, SE_KANNADA, SE_MALAYALAM, SE_THAI, SE_GEORGIAN, SE_ARMENIAN, SE_ETHIOPIC, SE_GOTHIC, SE_UGARITIC, SE_COPTIC, /*one-way (from) transliterators*/ SE_HAN, SE_KANJI}; -#define NUMSCRIPTS 32 -#define NUMTARGETSCRIPTS 5 +enum scriptEnum {SE_OFF, SE_LATIN, /*one-way (to) transliterators*/ SE_IPA, SE_BASICLATIN, SE_SBL, SE_TC, SE_BETA, SE_BGREEK, SE_SERA, SE_HUGOYE, SE_UNGEGN, SE_ISO, SE_ALALC, SE_BGNPCGN, /*two-way transliterators*/ SE_GREEK, SE_HEBREW, SE_CYRILLIC, SE_ARABIC, SE_SYRIAC, SE_KATAKANA, SE_HIRAGANA, SE_HANGUL, SE_DEVANAGARI, SE_TAMIL, SE_BENGALI, SE_GURMUKHI, SE_GUJARATI, SE_ORIYA, SE_TELUGU, SE_KANNADA, SE_MALAYALAM, SE_THAI, SE_GEORGIAN, SE_ARMENIAN, SE_ETHIOPIC, SE_GOTHIC, SE_UGARITIC, SE_COPTIC, SE_MEROITIC, SE_LINEARB, SE_CYPRIOT, SE_RUNIC, SE_OGHAM, SE_THAANA, SE_GLAGOLITIC, SE_TENGWAR, SE_CIRTH, /*one-way (from) transliterators*/ SE_JAMO, SE_HAN, SE_KANJI}; +#define NUMSCRIPTS 50 +#define NUMTARGETSCRIPTS NUMSCRIPTS-3//6 #include <swfilter.h> #include <swmodule.h> -#include <unicode/utypes.h> -#include <unicode/ucnv.h> -#include <unicode/ustring.h> -#include <unicode/uchar.h> - #include <unicode/unistr.h> + #include <unicode/translit.h> #include <defs.h> +#include <map> - /** This Filter shows/hides strong's numbers in a GBF text - */ -class SWDLLEXPORT UTF8Transliterator : public SWFilter -{ - char option; - - static const char optionstring[NUMTARGETSCRIPTS][16]; - - static const char optName[]; - static const char optTip[]; - OptionsList options; - - public: - UTF8Transliterator (); - virtual char ProcessText (char *text, int maxlen, const SWKey * key, const SWModule * = 0); - virtual const char *getOptionName () - { - return optName; - } - virtual const char *getOptionTip () - { - return optTip; - } - virtual void setOptionValue (const char *ival); - virtual const char *getOptionValue (); - virtual OptionsList getOptionValues () - { - return options; - } +SWORD_NAMESPACE_START + +struct SWTransData { + UnicodeString resource; + UTransDirection dir; }; +typedef std::map <const UnicodeString, SWTransData> SWTransMap; +typedef std::pair<UnicodeString, SWTransData> SWTransPair; -#endif +// Chris, please add more javadoc-style documentation in this header file +// so that the information will show up in the doxygen-generated +// api-docs. + +/** This Filter uses ICU for transliteration +*/ +class SWDLLEXPORT UTF8Transliterator : public SWFilter { +private: + + char option; + + static const char optionstring[NUMTARGETSCRIPTS][16]; + + static const char optName[]; + static const char optTip[]; + static const char SW_RB_RULE_BASED_IDS[]; + static const char SW_RB_RULE[]; + static const char SW_RESDATA[]; + StringList options; + static SWTransMap transMap; + UErrorCode utf8status; + + void Load(UErrorCode &status); + void registerTrans(const UnicodeString& ID, const UnicodeString& resource, UTransDirection dir, UErrorCode &status); + bool addTrans(const char* newTrans, SWBuf* transList); + bool checkTrans(const UnicodeString& ID, UErrorCode &status); + Transliterator *createTrans(const UnicodeString& ID, UTransDirection dir, UErrorCode &status); + +public: + UTF8Transliterator(); + virtual char processText(SWBuf &text, const SWKey *key = 0, const SWModule *module = 0); + virtual const char *getOptionName() { return optName; } + virtual const char *getOptionTip() { return optTip; } + virtual void setOptionValue(const char *ival); + virtual const char *getOptionValue(); + virtual StringList getOptionValues() { return options; } +}; +SWORD_NAMESPACE_END #endif |