summaryrefslogtreecommitdiff
path: root/src/modules/filters/utf8bidireorder.cpp
blob: 902047a2b87372ba4d44c0179275da77ded517bf (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
/******************************************************************************
*
* utf8cnormalizer - SWFilter descendant to perform reordering of UTF-8
*                   text to visual order according to Unicode BiDi
*/

#ifdef _ICU_

#include <stdlib.h>

#ifdef __GNUC__
#include <unixstr.h>
#endif

#include <utf8bidireorder.h>

SWORD_NAMESPACE_START

UTF8BiDiReorder::UTF8BiDiReorder() {

        conv = ucnv_open("UTF-8", &err);

}

UTF8BiDiReorder::~UTF8BiDiReorder() {
        ucnv_close(conv);
}

char UTF8BiDiReorder::processText(SWBuf &text, const SWKey *key, const SWModule *module)
{
        UChar *ustr, *ustr2;
	if ((unsigned long)key < 2)	// hack, we're en(1)/de(0)ciphering
		return -1;
        
        int32_t len = text.length();
        ustr = new UChar[len]; //each char could become a surrogate pair

	// Convert UTF-8 string to UTF-16 (UChars)
        len = ucnv_toUChars(conv, ustr, len, text.c_str(), -1, &err);
        ustr2 = new UChar[len];

        UBiDi* bidi = ubidi_openSized(len + 1, 0, &err);
        ubidi_setPara(bidi, ustr, len, UBIDI_DEFAULT_RTL, NULL, &err);
        len = ubidi_writeReordered(bidi, ustr2, len,
                UBIDI_DO_MIRRORING | UBIDI_REMOVE_BIDI_CONTROLS, &err);
        ubidi_close(bidi);

//        len = ubidi_writeReverse(ustr, len, ustr2, len,
//                UBIDI_DO_MIRRORING | UBIDI_REMOVE_BIDI_CONTROLS, &err);

	   text.setSize(text.size()*2);
	   len = ucnv_fromUChars(conv, text.getRawData(), text.size(), ustr2, len, &err);
	   text.setSize(len);

        delete [] ustr2;
        delete [] ustr;
	return 0;
}

SWORD_NAMESPACE_END
#endif