diff options
author | danglassey <danglassey> | 2002-08-14 09:57:17 +0000 |
---|---|---|
committer | danglassey <danglassey> | 2002-08-14 09:57:17 +0000 |
commit | c9458897ebbb739d8db83c80e06512d8a612f743 (patch) | |
tree | f8c5381045887e34388cc6b26cfccc254bf766dc /include/utf8transliterator.h | |
download | sword-sf-cvs-c9458897ebbb739d8db83c80e06512d8a612f743.tar.gz |
*** empty log message ***
Diffstat (limited to 'include/utf8transliterator.h')
-rw-r--r-- | include/utf8transliterator.h | 92 |
1 files changed, 92 insertions, 0 deletions
diff --git a/include/utf8transliterator.h b/include/utf8transliterator.h new file mode 100644 index 0000000..8e5175b --- /dev/null +++ b/include/utf8transliterator.h @@ -0,0 +1,92 @@ +/* + * + * Copyright 2001 CrossWire Bible Society (http://www.crosswire.org) + * CrossWire Bible Society + * P. O. Box 2528 + * Tempe, AZ 85280-2528 + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * General Public License for more details. + * + */ + +#ifndef UTF8TRANSLITERATOR_H +#define UTF8TRANSLITERATOR_H + +enum scriptEnum {SE_OFF, SE_LATIN, /*one-way (to) transliterators*/ SE_BASICLATIN, SE_BETA, SE_BGREEK, /*two-way transliterators*/ SE_GREEK, SE_HEBREW, SE_CYRILLIC, SE_ARABIC, SE_SYRIAC, SE_KATAKANA, SE_HIRAGANA, SE_JAMO, SE_HANGUL, SE_DEVANAGARI, SE_TAMIL, SE_BENGALI, SE_GURMUKHI, SE_GUJARATI, SE_ORIYA, SE_TELUGU, SE_KANNADA, SE_MALAYALAM, SE_THAI, SE_GEORGIAN, SE_ARMENIAN, SE_ETHIOPIC, SE_GOTHIC, SE_UGARITIC, SE_COPTIC, /*one-way (from) transliterators*/ SE_HAN, SE_KANJI}; +#define NUMSCRIPTS 32 +#define NUMTARGETSCRIPTS 5 + +#include <swfilter.h> +#include <swmodule.h> + +#include <unicode/utypes.h> +#include <unicode/ucnv.h> +#include <unicode/ustring.h> +#include <unicode/uchar.h> + +#include <unicode/unistr.h> +#include <unicode/translit.h> + +#include <defs.h> +#include <map> + +struct SWTransData { + UnicodeString resource; + UTransDirection dir; +}; +typedef map <const UnicodeString, SWTransData> SWTransMap; +typedef pair<UnicodeString, SWTransData> SWTransPair; + + /** This Filter uses ICU for transliteration + */ +class SWDLLEXPORT UTF8Transliterator : public SWFilter +{ +private: + + char option; + + static const char optionstring[NUMTARGETSCRIPTS][16]; + + static const char optName[]; + static const char optTip[]; + static const char SW_RB_RULE_BASED_IDS[]; + static const char SW_RB_RULE[]; + static const char SW_RESDATA[]; + OptionsList options; + static SWTransMap transMap; + UErrorCode utf8status; + + void Load(UErrorCode &status); + void registerTrans(const UnicodeString& ID, const UnicodeString& resource, + UTransDirection dir, UErrorCode &status ); + bool checkTrans(const UnicodeString& ID, UErrorCode &status ); + Transliterator * createTrans(const UnicodeString& preID, const UnicodeString& ID, + const UnicodeString& postID, UTransDirection dir, UErrorCode &status ); + + public: + UTF8Transliterator (); + virtual char ProcessText (char *text, int maxlen, const SWKey * key, const SWModule * = 0); + virtual const char *getOptionName () + { + return optName; + } + virtual const char *getOptionTip () + { + return optTip; + } + virtual void setOptionValue (const char *ival); + virtual const char *getOptionValue (); + virtual OptionsList getOptionValues () + { + return options; + } +}; + +#endif |