1 /*
2  * "streamable kanji code filter and converter"
3  * Copyright (c) 1998-2002 HappySize, Inc. All rights reserved.
4  *
5  * LICENSE NOTICES
6  *
7  * This file is part of "streamable kanji code filter and converter",
8  * which is distributed under the terms of GNU Lesser General Public
9  * License (version 2) as published by the Free Software Foundation.
10  *
11  * This software is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14  * GNU Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with "streamable kanji code filter and converter";
18  * if not, write to the Free Software Foundation, Inc., 59 Temple Place,
19  * Suite 330, Boston, MA  02111-1307  USA
20  *
21  * The author of this part: Den V. Tsopa <tdv@edisoft.ru>
22  *
23  */
/*
 * The source code included in this file was separated from mbfilter_ru.c
 * by moriyoshi koizumi <moriyoshi@php.net> on 4 dec 2002.
 *
 */
29 
30 #ifdef HAVE_CONFIG_H
31 #include "config.h"
32 #endif
33 
34 #include "mbfilter.h"
35 #include "mbfilter_koi8r.h"
36 #include "unicode_table_koi8r.h"
37 
38 static int mbfl_filt_ident_koi8r(int c, mbfl_identify_filter *filter);
39 
/* NULL-terminated list of alias names for the KOI8-R encoding. */
static const char *mbfl_encoding_koi8r_aliases[] = {
	"KOI8-R",
	"KOI8R",
	NULL
};
41 
42 const mbfl_encoding mbfl_encoding_koi8r = {
43 	mbfl_no_encoding_koi8r,
44 	"KOI8-R",
45 	"KOI8-R",
46 	(const char *(*)[])&mbfl_encoding_koi8r_aliases,
47 	NULL,
48 	MBFL_ENCTYPE_SBCS,
49 	&vtbl_koi8r_wchar,
50 	&vtbl_wchar_koi8r
51 };
52 
53 const struct mbfl_identify_vtbl vtbl_identify_koi8r = {
54 	mbfl_no_encoding_koi8r,
55 	mbfl_filt_ident_common_ctor,
56 	mbfl_filt_ident_common_dtor,
57 	mbfl_filt_ident_koi8r
58 };
59 
60 const struct mbfl_convert_vtbl vtbl_wchar_koi8r = {
61 	mbfl_no_encoding_wchar,
62 	mbfl_no_encoding_koi8r,
63 	mbfl_filt_conv_common_ctor,
64 	mbfl_filt_conv_common_dtor,
65 	mbfl_filt_conv_wchar_koi8r,
66 	mbfl_filt_conv_common_flush
67 };
68 
69 const struct mbfl_convert_vtbl vtbl_koi8r_wchar = {
70 	mbfl_no_encoding_koi8r,
71 	mbfl_no_encoding_wchar,
72 	mbfl_filt_conv_common_ctor,
73 	mbfl_filt_conv_common_dtor,
74 	mbfl_filt_conv_koi8r_wchar,
75 	mbfl_filt_conv_common_flush
76 };
77 
/*
 * CK(statement): evaluate `statement` once; if the result is negative, make
 * the enclosing function return -1 immediately. Wrapped in do/while(0) so it
 * behaves as a single statement.
 */
#define CK(statement) \
	do { \
		if ((statement) < 0) { \
			return (-1); \
		} \
	} while (0)
79 
80 /*
81  * koi8r => wchar
82  */
83 int
mbfl_filt_conv_koi8r_wchar(int c,mbfl_convert_filter * filter)84 mbfl_filt_conv_koi8r_wchar(int c, mbfl_convert_filter *filter)
85 {
86 	int s;
87 
88 	if (c >= 0 && c < koi8r_ucs_table_min) {
89 		s = c;
90 	} else if (c >= koi8r_ucs_table_min && c < 0x100) {
91 		s = koi8r_ucs_table[c - koi8r_ucs_table_min];
92 		if (s <= 0) {
93 			s = c;
94 			s &= MBFL_WCSPLANE_MASK;
95 			s |= MBFL_WCSPLANE_KOI8R;
96 		}
97 	} else {
98 		s = c;
99 		s &= MBFL_WCSGROUP_MASK;
100 		s |= MBFL_WCSGROUP_THROUGH;
101 	}
102 
103 	CK((*filter->output_function)(s, filter->data));
104 
105 	return c;
106 }
107 
108 /*
109  * wchar => koi8r
110  */
111 int
mbfl_filt_conv_wchar_koi8r(int c,mbfl_convert_filter * filter)112 mbfl_filt_conv_wchar_koi8r(int c, mbfl_convert_filter *filter)
113 {
114 	int s, n;
115 
116 	if (c < 0x80) {
117 		s = c;
118 	} else {
119 		s = -1;
120 		n = koi8r_ucs_table_len-1;
121 		while (n >= 0) {
122 			if (c == koi8r_ucs_table[n]) {
123 				s = koi8r_ucs_table_min + n;
124 				break;
125 			}
126 			n--;
127 		}
128 		if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_KOI8R) {
129 			s = c & MBFL_WCSPLANE_MASK;
130 		}
131 	}
132 
133 	if (s >= 0) {
134 		CK((*filter->output_function)(s, filter->data));
135 	} else {
136 		CK(mbfl_filt_conv_illegal_output(c, filter));
137 	}
138 
139 	return c;
140 }
141 
/*
 * Identify filter for KOI8-R.
 *
 * Clears filter->flag when `c` could be a KOI8-R byte and sets it to 1
 * ("not it") otherwise. Returns `c` unchanged.
 *
 * Every value in 0x00..0xff is accepted, matching the koi8r => wchar
 * converter in this file, which passes values below the table minimum
 * through unchanged and maps the remaining values below 0x100 via
 * koi8r_ucs_table. The previous range check (0x80 <= c < 0xff) rejected all
 * ASCII bytes as well as 0xff, so ordinary KOI8-R text containing spaces,
 * digits or newlines was flagged as not being KOI8-R.
 */
static int mbfl_filt_ident_koi8r(int c, mbfl_identify_filter *filter)
{
	if (c >= 0 && c <= 0xff) {
		filter->flag = 0;
	} else {
		filter->flag = 1; /* not it */
	}
	return c;
}
150