summaryrefslogtreecommitdiff
path: root/include/utf8transliterator.h
diff options
context:
space:
mode:
authorRoberto C. Sanchez <roberto@connexer.com>2014-03-29 10:53:49 -0400
committerRoberto C. Sanchez <roberto@connexer.com>2014-03-29 10:53:49 -0400
commit8c8aa6b07e595cfac56838b5964ab3e96051f1b2 (patch)
treeda38e2c1979148dbd3b0c7b87f930746f5ba7f44 /include/utf8transliterator.h
parent8d3fc864d094eeadc721f8e93436b37a5fab173e (diff)
Imported Upstream version 1.5.7
Diffstat (limited to 'include/utf8transliterator.h')
-rw-r--r--include/utf8transliterator.h93
1 files changed, 53 insertions, 40 deletions
diff --git a/include/utf8transliterator.h b/include/utf8transliterator.h
index b28d699..0956118 100644
--- a/include/utf8transliterator.h
+++ b/include/utf8transliterator.h
@@ -1,4 +1,6 @@
-/*
+/******************************************************************************
+ *
+ * $Id: utf8transliterator.h,v 1.22 2003/10/05 19:07:35 mgruner Exp $
*
* Copyright 2001 CrossWire Bible Society (http://www.crosswire.org)
* CrossWire Bible Society
@@ -15,59 +17,70 @@
* General Public License for more details.
*
*/
-#ifdef _ICU_
#ifndef UTF8TRANSLITERATOR_H
#define UTF8TRANSLITERATOR_H
-enum scriptEnum {SE_OFF, SE_LATIN, /*one-way (to) transliterators*/ SE_BASICLATIN, SE_BETA, SE_BGREEK, /*two-way transliterators*/ SE_GREEK, SE_HEBREW, SE_CYRILLIC, SE_ARABIC, SE_SYRIAC, SE_KATAKANA, SE_HIRAGANA, SE_JAMO, SE_HANGUL, SE_DEVANAGARI, SE_TAMIL, SE_BENGALI, SE_GURMUKHI, SE_GUJARATI, SE_ORIYA, SE_TELUGU, SE_KANNADA, SE_MALAYALAM, SE_THAI, SE_GEORGIAN, SE_ARMENIAN, SE_ETHIOPIC, SE_GOTHIC, SE_UGARITIC, SE_COPTIC, /*one-way (from) transliterators*/ SE_HAN, SE_KANJI};
-#define NUMSCRIPTS 32
-#define NUMTARGETSCRIPTS 5
+enum scriptEnum {SE_OFF, SE_LATIN, /*one-way (to) transliterators*/ SE_IPA, SE_BASICLATIN, SE_SBL, SE_TC, SE_BETA, SE_BGREEK, SE_SERA, SE_HUGOYE, SE_UNGEGN, SE_ISO, SE_ALALC, SE_BGNPCGN, /*two-way transliterators*/ SE_GREEK, SE_HEBREW, SE_CYRILLIC, SE_ARABIC, SE_SYRIAC, SE_KATAKANA, SE_HIRAGANA, SE_HANGUL, SE_DEVANAGARI, SE_TAMIL, SE_BENGALI, SE_GURMUKHI, SE_GUJARATI, SE_ORIYA, SE_TELUGU, SE_KANNADA, SE_MALAYALAM, SE_THAI, SE_GEORGIAN, SE_ARMENIAN, SE_ETHIOPIC, SE_GOTHIC, SE_UGARITIC, SE_COPTIC, SE_MEROITIC, SE_LINEARB, SE_CYPRIOT, SE_RUNIC, SE_OGHAM, SE_THAANA, SE_GLAGOLITIC, SE_TENGWAR, SE_CIRTH, /*one-way (from) transliterators*/ SE_JAMO, SE_HAN, SE_KANJI};
+#define NUMSCRIPTS 50
+#define NUMTARGETSCRIPTS NUMSCRIPTS-3//6
#include <swfilter.h>
#include <swmodule.h>
-#include <unicode/utypes.h>
-#include <unicode/ucnv.h>
-#include <unicode/ustring.h>
-#include <unicode/uchar.h>
-
#include <unicode/unistr.h>
+
#include <unicode/translit.h>
#include <defs.h>
+#include <map>
- /** This Filter shows/hides strong's numbers in a GBF text
- */
-class SWDLLEXPORT UTF8Transliterator : public SWFilter
-{
- char option;
-
- static const char optionstring[NUMTARGETSCRIPTS][16];
-
- static const char optName[];
- static const char optTip[];
- OptionsList options;
-
- public:
- UTF8Transliterator ();
- virtual char ProcessText (char *text, int maxlen, const SWKey * key, const SWModule * = 0);
- virtual const char *getOptionName ()
- {
- return optName;
- }
- virtual const char *getOptionTip ()
- {
- return optTip;
- }
- virtual void setOptionValue (const char *ival);
- virtual const char *getOptionValue ();
- virtual OptionsList getOptionValues ()
- {
- return options;
- }
+SWORD_NAMESPACE_START
+
+struct SWTransData {
+ UnicodeString resource;
+ UTransDirection dir;
};
+typedef std::map <const UnicodeString, SWTransData> SWTransMap;
+typedef std::pair<UnicodeString, SWTransData> SWTransPair;
-#endif
+// Chris, please add more javadoc-style documentation in this header file
+// so that the information will show up in the doxygen-generated
+// api-docs.
+
+/** This Filter uses ICU for transliteration
+*/
+class SWDLLEXPORT UTF8Transliterator : public SWFilter {
+private:
+
+ char option;
+
+ static const char optionstring[NUMTARGETSCRIPTS][16];
+
+ static const char optName[];
+ static const char optTip[];
+ static const char SW_RB_RULE_BASED_IDS[];
+ static const char SW_RB_RULE[];
+ static const char SW_RESDATA[];
+ StringList options;
+ static SWTransMap transMap;
+ UErrorCode utf8status;
+
+ void Load(UErrorCode &status);
+ void registerTrans(const UnicodeString& ID, const UnicodeString& resource, UTransDirection dir, UErrorCode &status);
+ bool addTrans(const char* newTrans, SWBuf* transList);
+ bool checkTrans(const UnicodeString& ID, UErrorCode &status);
+ Transliterator *createTrans(const UnicodeString& ID, UTransDirection dir, UErrorCode &status);
+
+public:
+ UTF8Transliterator();
+ virtual char processText(SWBuf &text, const SWKey *key = 0, const SWModule *module = 0);
+ virtual const char *getOptionName() { return optName; }
+ virtual const char *getOptionTip() { return optTip; }
+ virtual void setOptionValue(const char *ival);
+ virtual const char *getOptionValue();
+ virtual StringList getOptionValues() { return options; }
+};
+SWORD_NAMESPACE_END
#endif