aboutsummaryrefslogtreecommitdiffstats
path: root/include/utf8transliterator.h
blob: 10b2bcfabed5f6ca9f7288010df241a45eff3abc (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
/*
 *
 * Copyright 2001 CrossWire Bible Society (http://www.crosswire.org)
 *	CrossWire Bible Society
 *	P. O. Box 2528
 *	Tempe, AZ  85280-2528
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License as published by the
 * Free Software Foundation version 2.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 */

#ifndef UTF8TRANSLITERATOR_H
#define UTF8TRANSLITERATOR_H

/**
 * Script identifiers used by the transliteration filter.
 *
 * Enumerators are numbered consecutively from 0 (SE_OFF) in the order
 * listed; the group comments are carried over from the original one-line
 * declaration.
 */
enum scriptEnum {
	SE_OFF,			/* 0 */
	SE_LATIN,

	/* one-way (to) transliterators */
	SE_BASICLATIN,
	SE_BETA,
	SE_BGREEK,

	/* two-way transliterators */
	SE_GREEK,
	SE_HEBREW,
	SE_CYRILLIC,
	SE_ARABIC,
	SE_SYRIAC,
	SE_KATAKANA,
	SE_HIRAGANA,
	SE_JAMO,
	SE_HANGUL,
	SE_DEVANAGARI,
	SE_TAMIL,
	SE_BENGALI,
	SE_GURMUKHI,
	SE_GUJARATI,
	SE_ORIYA,
	SE_TELUGU,
	SE_KANNADA,
	SE_MALAYALAM,
	SE_THAI,
	SE_GEORGIAN,
	SE_ARMENIAN,
	SE_ETHIOPIC,
	SE_GOTHIC,
	SE_UGARITIC,
	SE_COPTIC,

	/* one-way (from) transliterators */
	SE_HAN,
	SE_KANJI		/* 31 */
};

/* Number of enumerators in scriptEnum (SE_OFF through SE_KANJI); keep in
 * sync by hand when the enum changes. */
#define NUMSCRIPTS 32

/* First dimension of UTF8Transliterator::optionstring.
 * NOTE(review): presumably covers SE_OFF through SE_BGREEK (5 entries) --
 * confirm against the optionstring definition. */
#define NUMTARGETSCRIPTS 5

#include <swfilter.h>
#include <swmodule.h>

//#include <unicode/utypes.h>
//#include <unicode/ucnv.h>
//#include <unicode/ustring.h>
//#include <unicode/uchar.h>

#include <unicode/unistr.h>
#include <unicode/translit.h>

#include <defs.h>
#include <map>


//class UnicodeString;

SWORD_NAMESPACE_START

/** Value type of SWTransMap: a resource string paired with a direction.
 *  NOTE(review): the fields mirror the (resource, dir) parameters of
 *  UTF8Transliterator::registerTrans -- presumably that is what fills
 *  them in; confirm in the implementation file.
 */
struct SWTransData {
	UnicodeString resource;
	UTransDirection dir;
};
/** Map from a UnicodeString key to its SWTransData entry. */
typedef std::map <const UnicodeString, SWTransData> SWTransMap;
/** Pair of (UnicodeString, SWTransData). The first member is non-const
 *  here, so this is not the same type as SWTransMap::value_type (whose
 *  key is const); inserting one into the map goes through a pair
 *  conversion.
 */
typedef std::pair<UnicodeString, SWTransData> SWTransPair;

  /** This Filter uses ICU for transliteration.
  *
  * Derives from SWFilter. Only the three inline getters are defined in
  * this header; every other member is declared here and defined
  * elsewhere.
  */
class SWDLLEXPORT UTF8Transliterator : public SWFilter
{
private:

  // NOTE(review): presumably the currently selected target script
  // (an index into optionstring) -- confirm in the implementation.
  char option;

  // NUMTARGETSCRIPTS fixed-size entries of 16 chars each.
  static const char optionstring[NUMTARGETSCRIPTS][16];

  // Returned by getOptionName() / getOptionTip() respectively.
  static const char optName[];
  static const char optTip[];
  // NOTE(review): the SW_RB_* / SW_RESDATA names suggest ICU resource
  // bundle keys and a data location -- confirm against their definitions.
  static const char SW_RB_RULE_BASED_IDS[];
  static const char SW_RB_RULE[];
  static const char SW_RESDATA[];
  // Returned by value from getOptionValues().
  OptionsList options;
  // Static: a single map shared by every UTF8Transliterator instance.
  static SWTransMap transMap;
  UErrorCode utf8status;
  
  // Private helpers, defined out of line. Each takes a UErrorCode by
  // non-const reference (`status`).
  // NOTE(review): Load/registerTrans/checkTrans presumably populate and
  // query transMap -- confirm in the implementation.
  void Load(UErrorCode &status);
  void  registerTrans(const UnicodeString& ID, const UnicodeString& resource,
		UTransDirection dir, UErrorCode &status );
  bool checkTrans(const UnicodeString& ID, UErrorCode &status );
  // NOTE(review): ownership of the returned Transliterator pointer is not
  // visible from this header -- confirm who deletes it.
  Transliterator * createTrans(const UnicodeString& preID, const UnicodeString& ID, 
  	const UnicodeString& postID, UTransDirection dir, UErrorCode &status );
  
 public:
  UTF8Transliterator ();
  // Filter entry point: receives a mutable text buffer with its maximum
  // length, a key, and an optional module pointer (defaults to 0).
  // NOTE(review): the meaning of the char return value is set by the
  // SWFilter contract, which is not visible here.
  virtual char ProcessText (char *text, int maxlen, const SWKey * key, const SWModule * = 0);
  /** @return the static option name string (optName). */
  virtual const char *getOptionName ()
    {
      return optName;
    }
  /** @return the static option tip string (optTip). */
  virtual const char *getOptionTip ()
    {
      return optTip;
    }
  // Setter/getter for the option value as a C string; defined out of line.
  virtual void setOptionValue (const char *ival);
  virtual const char *getOptionValue ();
  /** @return a copy of the options list held by this filter. */
  virtual OptionsList getOptionValues ()
    {
      return options;
    }
};

SWORD_NAMESPACE_END
#endif