1 /*
2  * CP1255.cs - Hebrew (Windows) code page.
3  *
4  * Copyright (c) 2002  Southern Storm Software, Pty Ltd
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining
7  * a copy of this software and associated documentation files (the "Software"),
8  * to deal in the Software without restriction, including without limitation
9  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10  * and/or sell copies of the Software, and to permit persons to whom the
11  * Software is furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included
14  * in all copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
17  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
20  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22  * OTHER DEALINGS IN THE SOFTWARE.
23  */
24 
25 // Generated from "ibm-5351.ucm".
26 
27 // WARNING: Modifying this file directly might be a bad idea.
28 // You should edit the code generator tools/ucm2cp.c instead for your changes
29 // to appear in all relevant classes.
30 namespace I18N.MidEast
31 {
32 
33 using System;
34 using System.Text;
35 using I18N.Common;
36 
37 [Serializable]
38 public class CP1255 : ByteEncoding
39 {
CP1255()40 	public CP1255()
41 		: base(1255, ToChars, "Hebrew (Windows)",
42 		       "windows-1255", "windows-1255", "windows-1255",
43 		       true, true, true, true, 1255)
44 	{}
45 
46 	private static readonly char[] ToChars = {
47 		'\u0000', '\u0001', '\u0002', '\u0003', '\u0004', '\u0005',
48 		'\u0006', '\u0007', '\u0008', '\u0009', '\u000A', '\u000B',
49 		'\u000C', '\u000D', '\u000E', '\u000F', '\u0010', '\u0011',
50 		'\u0012', '\u0013', '\u0014', '\u0015', '\u0016', '\u0017',
51 		'\u0018', '\u0019', '\u001A', '\u001B', '\u001C', '\u001D',
52 		'\u001E', '\u001F', '\u0020', '\u0021', '\u0022', '\u0023',
53 		'\u0024', '\u0025', '\u0026', '\u0027', '\u0028', '\u0029',
54 		'\u002A', '\u002B', '\u002C', '\u002D', '\u002E', '\u002F',
55 		'\u0030', '\u0031', '\u0032', '\u0033', '\u0034', '\u0035',
56 		'\u0036', '\u0037', '\u0038', '\u0039', '\u003A', '\u003B',
57 		'\u003C', '\u003D', '\u003E', '\u003F', '\u0040', '\u0041',
58 		'\u0042', '\u0043', '\u0044', '\u0045', '\u0046', '\u0047',
59 		'\u0048', '\u0049', '\u004A', '\u004B', '\u004C', '\u004D',
60 		'\u004E', '\u004F', '\u0050', '\u0051', '\u0052', '\u0053',
61 		'\u0054', '\u0055', '\u0056', '\u0057', '\u0058', '\u0059',
62 		'\u005A', '\u005B', '\u005C', '\u005D', '\u005E', '\u005F',
63 		'\u0060', '\u0061', '\u0062', '\u0063', '\u0064', '\u0065',
64 		'\u0066', '\u0067', '\u0068', '\u0069', '\u006A', '\u006B',
65 		'\u006C', '\u006D', '\u006E', '\u006F', '\u0070', '\u0071',
66 		'\u0072', '\u0073', '\u0074', '\u0075', '\u0076', '\u0077',
67 		'\u0078', '\u0079', '\u007A', '\u007B', '\u007C', '\u007D',
68 		'\u007E', '\u007F', '\u20AC', '\u0081', '\u201A', '\u0192',
69 		'\u201E', '\u2026', '\u2020', '\u2021', '\u02C6', '\u2030',
70 		'\u008A', '\u2039', '\u008C', '\u008D', '\u008E', '\u008F',
71 		'\u0090', '\u2018', '\u2019', '\u201C', '\u201D', '\u2022',
72 		'\u2013', '\u2014', '\u02DC', '\u2122', '\u009A', '\u203A',
73 		'\u009C', '\u009D', '\u009E', '\u009F', '\u00A0', '\u00A1',
74 		'\u00A2', '\u00A3', '\u20AA', '\u00A5', '\u00A6', '\u00A7',
75 		'\u00A8', '\u00A9', '\u00D7', '\u00AB', '\u00AC', '\u00AD',
76 		'\u00AE', '\u00AF', '\u00B0', '\u00B1', '\u00B2', '\u00B3',
77 		'\u00B4', '\u00B5', '\u00B6', '\u00B7', '\u00B8', '\u00B9',
78 		'\u00F7', '\u00BB', '\u00BC', '\u00BD', '\u00BE', '\u00BF',
79 		'\u05B0', '\u05B1', '\u05B2', '\u05B3', '\u05B4', '\u05B5',
80 		'\u05B6', '\u05B7', '\u05B8', '\u05B9', '\u003F', '\u05BB',
81 		'\u05BC', '\u05BD', '\u05BE', '\u05BF', '\u05C0', '\u05C1',
82 		'\u05C2', '\u05C3', '\u05F0', '\u05F1', '\u05F2', '\u05F3',
83 		'\u05F4', '\u003F', '\u003F', '\u003F', '\u003F', '\u003F',
84 		'\u003F', '\u003F', '\u05D0', '\u05D1', '\u05D2', '\u05D3',
85 		'\u05D4', '\u05D5', '\u05D6', '\u05D7', '\u05D8', '\u05D9',
86 		'\u05DA', '\u05DB', '\u05DC', '\u05DD', '\u05DE', '\u05DF',
87 		'\u05E0', '\u05E1', '\u05E2', '\u05E3', '\u05E4', '\u05E5',
88 		'\u05E6', '\u05E7', '\u05E8', '\u05E9', '\u05EA', '\u003F',
89 		'\u003F', '\u200E', '\u200F', '\u003F',
90 	};
91 
92 	// Get the number of bytes needed to encode a character buffer.
GetByteCountImpl(char* chars, int count)93 	public unsafe override int GetByteCountImpl (char* chars, int count)
94 	{
95 		if (this.EncoderFallback != null)		{
96 			//Calculate byte count by actually doing encoding and discarding the data.
97 			return GetBytesImpl(chars, count, null, 0);
98 		}
99 		else
100 		{
101 			return count;
102 		}
103 	}
104 
105 	// Get the number of bytes needed to encode a character buffer.
GetByteCount(String s)106 	public override int GetByteCount (String s)
107 	{
108 		if (this.EncoderFallback != null)
109 		{
110 			//Calculate byte count by actually doing encoding and discarding the data.
111 			unsafe
112 			{
113 				fixed (char *s_ptr = s)
114 				{
115 					return GetBytesImpl(s_ptr, s.Length, null, 0);
116 				}
117 			}
118 		}
119 		else
120 		{
121 			//byte count equals character count because no EncoderFallback set
122 			return s.Length;
123 		}
124 	}
125 
126 	//ToBytes is just an alias for GetBytesImpl, but doesn't return byte count
ToBytes(char* chars, int charCount, byte* bytes, int byteCount)127 	protected unsafe override void ToBytes(char* chars, int charCount,
128 	                                byte* bytes, int byteCount)
129 	{
130 		//Calling ToBytes with null destination buffer doesn't make any sense
131 		if (bytes == null)
132 			throw new ArgumentNullException("bytes");
133 		GetBytesImpl(chars, charCount, bytes, byteCount);
134 	}
135 
GetBytesImpl(char* chars, int charCount, byte* bytes, int byteCount)136 	public unsafe override int GetBytesImpl (char* chars, int charCount,
137 	                                         byte* bytes, int byteCount)
138 	{
139 		int ch;
140 		int charIndex = 0;
141 		int byteIndex = 0;
142 		EncoderFallbackBuffer buffer = null;
143 		while (charCount > 0)
144 		{
145 			ch = (int)(chars[charIndex]);
146 			if(ch >= 128) switch(ch)
147 			{
148 				case 0x0081:
149 				case 0x008A:
150 				case 0x008C:
151 				case 0x008D:
152 				case 0x008E:
153 				case 0x008F:
154 				case 0x0090:
155 				case 0x009A:
156 				case 0x009C:
157 				case 0x009D:
158 				case 0x009E:
159 				case 0x009F:
160 				case 0x00A0:
161 				case 0x00A1:
162 				case 0x00A2:
163 				case 0x00A3:
164 				case 0x00A5:
165 				case 0x00A6:
166 				case 0x00A7:
167 				case 0x00A8:
168 				case 0x00A9:
169 				case 0x00AB:
170 				case 0x00AC:
171 				case 0x00AD:
172 				case 0x00AE:
173 				case 0x00AF:
174 				case 0x00B0:
175 				case 0x00B1:
176 				case 0x00B2:
177 				case 0x00B3:
178 				case 0x00B4:
179 				case 0x00B5:
180 				case 0x00B6:
181 				case 0x00B7:
182 				case 0x00B8:
183 				case 0x00B9:
184 				case 0x00BB:
185 				case 0x00BC:
186 				case 0x00BD:
187 				case 0x00BE:
188 				case 0x00BF:
189 					break;
190 				case 0x00D7: ch = 0xAA; break;
191 				case 0x00F7: ch = 0xBA; break;
192 				case 0x0192: ch = 0x83; break;
193 				case 0x02C6: ch = 0x88; break;
194 				case 0x02DC: ch = 0x98; break;
195 				case 0x05B0:
196 				case 0x05B1:
197 				case 0x05B2:
198 				case 0x05B3:
199 				case 0x05B4:
200 				case 0x05B5:
201 				case 0x05B6:
202 				case 0x05B7:
203 				case 0x05B8:
204 				case 0x05B9:
205 					ch -= 0x04F0;
206 					break;
207 				case 0x05BB:
208 				case 0x05BC:
209 				case 0x05BD:
210 				case 0x05BE:
211 				case 0x05BF:
212 				case 0x05C0:
213 				case 0x05C1:
214 				case 0x05C2:
215 				case 0x05C3:
216 					ch -= 0x04F0;
217 					break;
218 				case 0x05D0:
219 				case 0x05D1:
220 				case 0x05D2:
221 				case 0x05D3:
222 				case 0x05D4:
223 				case 0x05D5:
224 				case 0x05D6:
225 				case 0x05D7:
226 				case 0x05D8:
227 				case 0x05D9:
228 				case 0x05DA:
229 				case 0x05DB:
230 				case 0x05DC:
231 				case 0x05DD:
232 				case 0x05DE:
233 				case 0x05DF:
234 				case 0x05E0:
235 				case 0x05E1:
236 				case 0x05E2:
237 				case 0x05E3:
238 				case 0x05E4:
239 				case 0x05E5:
240 				case 0x05E6:
241 				case 0x05E7:
242 				case 0x05E8:
243 				case 0x05E9:
244 				case 0x05EA:
245 					ch -= 0x04F0;
246 					break;
247 				case 0x05F0:
248 				case 0x05F1:
249 				case 0x05F2:
250 				case 0x05F3:
251 				case 0x05F4:
252 					ch -= 0x051C;
253 					break;
254 				case 0x200E: ch = 0xFD; break;
255 				case 0x200F: ch = 0xFE; break;
256 				case 0x2013: ch = 0x96; break;
257 				case 0x2014: ch = 0x97; break;
258 				case 0x2018: ch = 0x91; break;
259 				case 0x2019: ch = 0x92; break;
260 				case 0x201A: ch = 0x82; break;
261 				case 0x201C: ch = 0x93; break;
262 				case 0x201D: ch = 0x94; break;
263 				case 0x201E: ch = 0x84; break;
264 				case 0x2020: ch = 0x86; break;
265 				case 0x2021: ch = 0x87; break;
266 				case 0x2022: ch = 0x95; break;
267 				case 0x2026: ch = 0x85; break;
268 				case 0x2030: ch = 0x89; break;
269 				case 0x2039: ch = 0x8B; break;
270 				case 0x203A: ch = 0x9B; break;
271 				case 0x20AA: ch = 0xA4; break;
272 				case 0x20AC: ch = 0x80; break;
273 				case 0x2122: ch = 0x99; break;
274 				default:
275 				{
276 					if(ch >= 0xFF01 && ch <= 0xFF5E)
277 					{
278 						ch -= 0xFEE0;
279 					}
280 					else
281 					{
282 						HandleFallback (ref buffer, chars, ref charIndex, ref charCount, bytes, ref byteIndex, ref byteCount);
283 						charIndex++;
284 						charCount--;
285 						continue;
286 					}
287 				}
288 				break;
289 			}
290 			//Write encoded byte to buffer, if buffer is defined and fallback was not used
291 			if (bytes != null)
292 				bytes[byteIndex] = (byte)ch;
293 			byteIndex++;
294 			byteCount--;
295 			charIndex++;
296 			charCount--;
297 		}
298 		return byteIndex;
299 	}
300 }; // class CP1255
301 
302 [Serializable]
303 public class ENCwindows_1255 : CP1255
304 {
ENCwindows_1255()305 	public ENCwindows_1255() : base() {}
306 
307 }; // class ENCwindows_1255
308 
309 }; // namespace I18N.MidEast
310