# Root of the unpacked conversion-tables.tar.gz package.
# Every $(TABLESDIR)/... prerequisite in this file is looked up under it.
TABLESDIR = /home/bruno/chs/conversion-tables
# ASCII: feed the glibc-2.1-iconv table to 8bit_tab_to_h on stdin.
ascii.h: $(TABLESDIR)/glibc-2.1-iconv/ASCII.TXT 8bit_tab_to_h
	./8bit_tab_to_h ASCII ascii < $<
# ISO-8859-1: feed the unicode.org 8859-1 table to 8bit_tab_to_h on stdin.
iso8859_1.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-1.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-1 iso8859_1 < $<
# ISO-8859-2: feed the unicode.org 8859-2 table to 8bit_tab_to_h on stdin.
iso8859_2.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-2.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-2 iso8859_2 < $<
# ISO-8859-3: feed the unicode.org 8859-3 table to 8bit_tab_to_h on stdin.
iso8859_3.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-3.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-3 iso8859_3 < $<
# ISO-8859-4: feed the unicode.org 8859-4 table to 8bit_tab_to_h on stdin.
iso8859_4.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-4.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-4 iso8859_4 < $<
# ISO-8859-5: feed the unicode.org 8859-5 table to 8bit_tab_to_h on stdin.
iso8859_5.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-5.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-5 iso8859_5 < $<
# ISO-8859-6: feed the unicode.org 8859-6 table to 8bit_tab_to_h on stdin.
iso8859_6.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-6.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-6 iso8859_6 < $<
# ISO-8859-7: note that the input is the 8859-7-2003.TXT table, not 8859-7.TXT.
iso8859_7.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-7-2003.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-7 iso8859_7 < $<
# ISO-8859-8: feed the unicode.org 8859-8 table to 8bit_tab_to_h on stdin.
iso8859_8.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-8.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-8 iso8859_8 < $<
# ISO-8859-9: feed the unicode.org 8859-9 table to 8bit_tab_to_h on stdin.
iso8859_9.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-9.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-9 iso8859_9 < $<
# ISO-8859-10: feed the unicode.org 8859-10 table to 8bit_tab_to_h on stdin.
iso8859_10.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-10.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-10 iso8859_10 < $<
# ISO-8859-11: feed the unicode.org 8859-11 table to 8bit_tab_to_h on stdin.
iso8859_11.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-11.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-11 iso8859_11 < $<
# ISO-8859-13: feed the unicode.org 8859-13 table to 8bit_tab_to_h on stdin.
iso8859_13.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-13.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-13 iso8859_13 < $<
# ISO-8859-14: feed the unicode.org 8859-14 table to 8bit_tab_to_h on stdin.
iso8859_14.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-14.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-14 iso8859_14 < $<
# ISO-8859-15: feed the unicode.org 8859-15 table to 8bit_tab_to_h on stdin.
iso8859_15.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-15.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-15 iso8859_15 < $<
# ISO-8859-16: feed the unicode.org 8859-16 table to 8bit_tab_to_h on stdin.
iso8859_16.h: $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-16.TXT 8bit_tab_to_h
	./8bit_tab_to_h ISO-8859-16 iso8859_16 < $<
# KOI8-R: feed the unicode.org VENDORS/MISC table to 8bit_tab_to_h on stdin.
koi8_r.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MISC/KOI8-R.TXT 8bit_tab_to_h
	./8bit_tab_to_h KOI8-R koi8_r < $<
# KOI8-U: feed the csets-new table to 8bit_tab_to_h on stdin.
koi8_u.h: $(TABLESDIR)/csets-new/KOI8-U.TXT 8bit_tab_to_h
	./8bit_tab_to_h KOI8-U koi8_u < $<
# KOI8-RU: feed the freebsd-iconv-0.4 table to 8bit_tab_to_h on stdin.
koi8_ru.h: $(TABLESDIR)/freebsd-iconv-0.4/KOI8-RU.TXT 8bit_tab_to_h
	./8bit_tab_to_h KOI8-RU koi8_ru < $<
# CP1250: feed the Microsoft WINDOWS table to 8bit_tab_to_h on stdin.
cp1250.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1250.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP1250 cp1250 < $<
# CP1251: feed the Microsoft WINDOWS table to 8bit_tab_to_h on stdin.
cp1251.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1251.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP1251 cp1251 < $<
# CP1252: feed the Microsoft WINDOWS table to 8bit_tab_to_h on stdin.
cp1252.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1252.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP1252 cp1252 < $<
# CP1253: feed the Microsoft WINDOWS table to 8bit_tab_to_h on stdin.
cp1253.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1253.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP1253 cp1253 < $<
# CP1254: feed the Microsoft WINDOWS table to 8bit_tab_to_h on stdin.
cp1254.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1254.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP1254 cp1254 < $<
# CP1255: feed the Microsoft WINDOWS table to 8bit_tab_to_h on stdin.
cp1255.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1255.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP1255 cp1255 < $<
# CP1256: feed the Microsoft WINDOWS table to 8bit_tab_to_h on stdin.
cp1256.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1256.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP1256 cp1256 < $<
# CP1257: feed the Microsoft WINDOWS table to 8bit_tab_to_h on stdin.
cp1257.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1257.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP1257 cp1257 < $<
# CP1258: feed the Microsoft WINDOWS table to 8bit_tab_to_h on stdin.
cp1258.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1258.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP1258 cp1258 < $<
# CP850: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp850.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP850.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP850 cp850 < $<
# CP862: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp862.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP862.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP862 cp862 < $<
# CP866: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp866.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP866.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP866 cp866 < $<
# CP1131: a lone '#' line is emitted ahead of the table before it is piped
# into 8bit_tab_to_h.
cp1131.h: $(TABLESDIR)/other/CP1131.TXT 8bit_tab_to_h
	(echo '#' ; cat $<) | ./8bit_tab_to_h CP1131 cp1131
# MacRoman: feed the jdk-1.1.7b table to 8bit_tab_to_h on stdin.
mac_roman.h: $(TABLESDIR)/jdk-1.1.7b/MAC-ROMAN.TXT 8bit_tab_to_h
	./8bit_tab_to_h MacRoman mac_roman < $<
# MacCentralEurope: feed the jdk-1.1.7b table to 8bit_tab_to_h on stdin.
mac_centraleurope.h: $(TABLESDIR)/jdk-1.1.7b/MAC-CENTRAL-EUROPE.TXT 8bit_tab_to_h
	./8bit_tab_to_h MacCentralEurope mac_centraleurope < $<
# MacIceland: feed the jdk-1.1.7b table to 8bit_tab_to_h on stdin.
mac_iceland.h: $(TABLESDIR)/jdk-1.1.7b/MAC-ICELAND.TXT 8bit_tab_to_h
	./8bit_tab_to_h MacIceland mac_iceland < $<
# MacCroatian: feed the jdk-1.1.7b table to 8bit_tab_to_h on stdin.
mac_croatian.h: $(TABLESDIR)/jdk-1.1.7b/MAC-CROATIAN.TXT 8bit_tab_to_h
	./8bit_tab_to_h MacCroatian mac_croatian < $<
# MacRomania: feed the jdk-1.1.7b table to 8bit_tab_to_h on stdin.
mac_romania.h: $(TABLESDIR)/jdk-1.1.7b/MAC-ROMANIA.TXT 8bit_tab_to_h
	./8bit_tab_to_h MacRomania mac_romania < $<
# MacCyrillic: feed the jdk-1.1.7b table to 8bit_tab_to_h on stdin.
mac_cyrillic.h: $(TABLESDIR)/jdk-1.1.7b/MAC-CYRILLIC.TXT 8bit_tab_to_h
	./8bit_tab_to_h MacCyrillic mac_cyrillic < $<
# MacUkraine: feed the jdk-1.1.7b table to 8bit_tab_to_h on stdin.
mac_ukraine.h: $(TABLESDIR)/jdk-1.1.7b/MAC-UKRAINE.TXT 8bit_tab_to_h
	./8bit_tab_to_h MacUkraine mac_ukraine < $<
# MacGreek: feed the jdk-1.1.7b table to 8bit_tab_to_h on stdin.
mac_greek.h: $(TABLESDIR)/jdk-1.1.7b/MAC-GREEK.TXT 8bit_tab_to_h
	./8bit_tab_to_h MacGreek mac_greek < $<
# MacTurkish: feed the jdk-1.1.7b table to 8bit_tab_to_h on stdin.
mac_turkish.h: $(TABLESDIR)/jdk-1.1.7b/MAC-TURKISH.TXT 8bit_tab_to_h
	./8bit_tab_to_h MacTurkish mac_turkish < $<
# MacHebrew: feed the jdk-1.1.7b table to 8bit_tab_to_h on stdin.
mac_hebrew.h: $(TABLESDIR)/jdk-1.1.7b/MAC-HEBREW.TXT 8bit_tab_to_h
	./8bit_tab_to_h MacHebrew mac_hebrew < $<
# MacArabic: feed the jdk-1.1.7b table to 8bit_tab_to_h on stdin.
mac_arabic.h: $(TABLESDIR)/jdk-1.1.7b/MAC-ARABIC.TXT 8bit_tab_to_h
	./8bit_tab_to_h MacArabic mac_arabic < $<
# MacThai: feed the jdk-1.1.7b table to 8bit_tab_to_h on stdin.
mac_thai.h: $(TABLESDIR)/jdk-1.1.7b/MAC-THAI.TXT 8bit_tab_to_h
	./8bit_tab_to_h MacThai mac_thai < $<
# HP-ROMAN8: feed the glibc-2.1-iconv table to 8bit_tab_to_h on stdin.
hp_roman8.h: $(TABLESDIR)/glibc-2.1-iconv/HP-ROMAN8.TXT 8bit_tab_to_h
	./8bit_tab_to_h HP-ROMAN8 hp_roman8 < $<
# NEXTSTEP: feed the clisp table to 8bit_tab_to_h on stdin.
nextstep.h: $(TABLESDIR)/clisp/NEXTSTEP.TXT 8bit_tab_to_h
	./8bit_tab_to_h NEXTSTEP nextstep < $<
# ARMSCII-8: a lone '#' line is emitted ahead of the glibc-2.2.90-iconv table
# before it is piped into 8bit_tab_to_h.
armscii_8.h: $(TABLESDIR)/glibc-2.2.90-iconv/ARMSCII-8.TXT 8bit_tab_to_h
	(echo '#' ; cat $<) | ./8bit_tab_to_h ARMSCII-8 armscii_8
# GEORGIAN-ACADEMY: feed the csets-1.6 GEO-ITA table to 8bit_tab_to_h on stdin.
georgian_academy.h: $(TABLESDIR)/csets-1.6/GEO-ITA.TXT 8bit_tab_to_h
	./8bit_tab_to_h GEORGIAN-ACADEMY georgian_academy < $<
# GEORGIAN-PS: feed the csets-1.6 GEO-PS table to 8bit_tab_to_h on stdin.
georgian_ps.h: $(TABLESDIR)/csets-1.6/GEO-PS.TXT 8bit_tab_to_h
	./8bit_tab_to_h GEORGIAN-PS georgian_ps < $<
# KOI8-T: a lone '#' line is emitted ahead of the glibc-2.2.90-iconv table
# before it is piped into 8bit_tab_to_h.
# 8bit_tab_to_h is listed as a prerequisite because the recipe executes it;
# without it the tool may be missing or stale when this rule runs.  It is
# placed last so that $< still names the table file.
koi8_t.h : $(TABLESDIR)/glibc-2.2.90-iconv/KOI8-T.TXT 8bit_tab_to_h
	(echo '#' ; cat $<) | ./8bit_tab_to_h KOI8-T koi8_t
# PT154: feed the IANA PTCP154 table to 8bit_tab_to_h on stdin.
# 8bit_tab_to_h is listed as a prerequisite because the recipe executes it;
# without it the tool may be missing or stale when this rule runs.  It is
# placed last so that $< still names the table file.
pt154.h : $(TABLESDIR)/IANA/PTCP154.TXT 8bit_tab_to_h
	./8bit_tab_to_h PT154 pt154 < $<
# RK1048: a lone '#' line is emitted ahead of the IANA KZ-1048 table before it
# is piped into 8bit_tab_to_h.
# 8bit_tab_to_h is listed as a prerequisite because the recipe executes it;
# without it the tool may be missing or stale when this rule runs.  It is
# placed last so that $< still names the table file.
rk1048.h : $(TABLESDIR)/IANA/KZ-1048.TXT 8bit_tab_to_h
	(echo '#' ; cat $<) | ./8bit_tab_to_h RK1048 rk1048
# MULELAO-1: feed the csets-new MULELAO1 table to 8bit_tab_to_h on stdin.
mulelao.h: $(TABLESDIR)/csets-new/MULELAO1.TXT 8bit_tab_to_h
	./8bit_tab_to_h MULELAO-1 mulelao < $<
# IBM-CP1133: feed the csets-new CP1133 table to 8bit_tab_to_h on stdin.
cp1133.h: $(TABLESDIR)/csets-new/CP1133.TXT 8bit_tab_to_h
	./8bit_tab_to_h IBM-CP1133 cp1133 < $<
# TIS620.2533-1: feed the glibc-2.1-iconv TIS-620 table to 8bit_tab_to_h on stdin.
tis620.h: $(TABLESDIR)/glibc-2.1-iconv/TIS-620.TXT 8bit_tab_to_h
	./8bit_tab_to_h TIS620.2533-1 tis620 < $<
# CP874: feed the Microsoft WINDOWS table to 8bit_tab_to_h on stdin.
cp874.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP874.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP874 cp874 < $<
# VISCII1.1-1: feed the csets-1.6 VISCII table to 8bit_tab_to_h on stdin.
viscii.h: $(TABLESDIR)/csets-1.6/VISCII.TXT 8bit_tab_to_h
	./8bit_tab_to_h VISCII1.1-1 viscii < $<
# TCVN-5712: feed the csets-1.6 VN5712-1 table to 8bit_tab_to_h on stdin.
tcvn.h: $(TABLESDIR)/csets-1.6/VN5712-1.TXT 8bit_tab_to_h
	./8bit_tab_to_h TCVN-5712 tcvn < $<
# JISX0201.1976-0: feed the clisp JIS_X0201 table to 8bit_tab_to_h on stdin.
jisx0201.h: $(TABLESDIR)/clisp/JIS_X0201.TXT 8bit_tab_to_h
	./8bit_tab_to_h JISX0201.1976-0 jisx0201 < $<
# We use modified JISX0208 and JISX0212 tables. Why?
# Hironori Sakamoto and Tomohiro Kubota explain that
#   - EUC-JP and SHIFT_JIS contain JISX0208 exactly,
#   - Their round-trip conversion to Unicode and back must be the identity,
#   - Conversions between EUC-JP, SHIFT_JIS, CP932, ISO-2022-JP must behave
#     as if no Unicode conversion was involved,
#   - When JISX0208 is used as a CES (i.e. combined with ASCII) its mapping of
#     REVERSE SOLIDUS becomes a FULLWIDTH REVERSE SOLIDUS, apparently because
#     round-trip conversion stability is more important than a particular glyph.
#     Only when JISX0208 is used as a CCS is the character a REVERSE SOLIDUS.
# As a consequence, we use FULLWIDTH REVERSE SOLIDUS in EUC-JP's JISX0208 part,
# and for consistency also in SHIFT_JIS and ISO-2022-JP, i.e. everywhere.
# JISX0208 never occurs as a CCS in practice. Similarly with JISX0212.
# Unicode.org maps 0x2140 to U+005C. We map it to U+FF3C.
# The first sed drops the leading 0x.... column of each mapping line; the
# second rewrites a 0x005C target to 0xFF3C.  The result is piped into
# cjk_tab_to_h, whose stdout becomes the target.
# NOTE(review): the "[ ]" bracket expressions are reproduced as they appear in
# this copy; confirm whether they were meant to hold a tab as well as a space.
jisx0208.h: $(TABLESDIR)/unicode.org-mappings/EASTASIA/JIS/JIS0208.TXT cjk_tab_to_h
	sed -e 's,^0x....[ ]*\(0x....[ ]*0x.....*\)$$,\1,' < $< \
	  | sed -e 's,\([ ]\)0x005C,\10xFF3C,' \
	  | ./cjk_tab_to_h JISX0208.1990-0 jisx0208 > $@
# Unicode.org maps 0x2237 to U+007E. We map it to U+FF5E.
# sed rewrites a 0x007E target to 0xFF5E before the table is piped into
# cjk_tab_to_h, whose stdout becomes the target.
# NOTE(review): the "[ ]" bracket expression is reproduced as it appears in
# this copy; confirm whether it was meant to hold a tab as well as a space.
jisx0212.h: $(TABLESDIR)/unicode.org-mappings/EASTASIA/JIS/JIS0212.TXT cjk_tab_to_h
	sed -e 's,\([ ]\)0x007E,\10xFF5E,' < $< \
	  | ./cjk_tab_to_h JISX0212.1990-0 jisx0212 > $@
# CP932 extensions: keep only the CP932.TXT lines whose code starts with
# 0x87, 0xED..0xEF or 0xF0..0xFF, preceded by a lone '#' line.
cp932ext.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP932.TXT cjk_tab_to_h
	(echo '#' ; grep '^0x\(87\|E[D-F]\|F[0-9A-F]\)[0-9A-F][0-9A-F]' < $< ) \
	  | ./cjk_tab_to_h 'CP932 extensions' cp932ext > $@
# GB2312.1980-0: cjk_tab_to_h reads the unicode.org table on stdin and its
# stdout becomes the target.
gb2312.h: $(TABLESDIR)/unicode.org-mappings/EASTASIA/GB/GB2312.TXT cjk_tab_to_h
	./cjk_tab_to_h GB2312.1980-0 gb2312 < $< > $@
# ISO-IR-165 extensions: drop the lines starting with 0x28 or 0x2A from the
# additions table, prefix a lone '#' line, and pipe into cjk_tab_to_h.
isoir165ext.h: $(TABLESDIR)/csets-new/ISO-IR-165-additions.TXT cjk_tab_to_h
	(echo '#' ; grep -v '^0x2[8A]' < $<) \
	  | ./cjk_tab_to_h 'ISO-IR-165 extensions' isoir165ext > $@
# GB/T 12345 extensions.
# Prerequisites, in order: GB2312.TXT ($<), GB12345-FIXED.TXT ($(word 2,$^)),
# GB12345-more.TXT ($(word 3,$^)), then the cjk_tab_to_h tool.
# Steps:
#   1. strip "#UNDEFINED" lines, comments and blank lines from GB2312.TXT and
#      from GB12345-FIXED.TXT into two scratch files;
#   2. diff them and keep only the lines present in the second ("> " lines);
#   3. append GB12345-more.TXT;
#   4. pipe everything (after a lone '#' line) into cjk_tab_to_h.
# The scratch files are named after the target ($@.tmp1, $@.tmp2) rather than
# the fixed tmp1.TXT/tmp2.TXT, which the GBKext.TXT rule also writes: with
# fixed names the two recipes clobber each other's data under "make -j".
# NOTE(review): the "[ ]" bracket expressions are reproduced as they appear in
# this copy; confirm whether they were meant to hold a tab as well as a space.
gb12345ext.h : $(TABLESDIR)/unicode.org-mappings/EASTASIA/GB/GB2312.TXT $(TABLESDIR)/unicode.org-mappings/EASTASIA/GB/GB12345-FIXED.TXT $(TABLESDIR)/csets-new/GB12345-more.TXT cjk_tab_to_h
	(echo '#' ; \
	 sed -e '/^0x..[ ]*#UNDEFINED/d' -e 's/#.*$$//' -e '/^[ ]*$$/d' $< > $@.tmp1 ; \
	 sed -e '/^0x..[ ]*#UNDEFINED/d' -e 's/#.*$$//' -e '/^[ ]*$$/d' $(word 2,$^) > $@.tmp2 ; \
	 diff $@.tmp1 $@.tmp2 | grep '^> ' | sed -e 's,^> ,,' ; \
	 cat $(word 3,$^) ) \
	  | ./cjk_tab_to_h 'GB/T 12345.1990-0 extensions' gb12345ext > $@ \
	  && rm -f $@.tmp1 $@.tmp2
# GBK/3 extensions: GBKext.TXT lines whose code starts with 0x8., 0x9. or 0xA0,
# preceded by a lone '#' line.  $< is GBKext.TXT.
gbkext1.h: GBKext.TXT cjk_tab_to_h
	(echo '#' ; grep '^0x\([89].\|A0\)' < $< ) \
	  | ./cjk_tab_to_h 'GBK/3 extensions' gbkext1 > $@
# GBK/4 and GBK/5 extensions: GBKext.TXT lines with first byte 0xA1..0xFF and
# second byte matching [4-9]. or A0, preceded by a lone '#' line.
# $< is GBKext.TXT.
gbkext2.h: GBKext.TXT cjk_tab_to_h
	(echo '#' ; grep '^0x\(A[1-9A-F]\|[B-F][0-9A-F]\)\([4-9].\|A0\)' < $< ) \
	  | ./cjk_tab_to_h 'GBK/4 and GBK/5 extensions' gbkext2 > $@
# GBK extensions (combined): the two greps select, in order, the same line
# sets used by the gbkext1.h and gbkext2.h rules.  $< is GBKext.TXT.
gbkext_inv.h: GBKext.TXT cjk_tab_to_h
	(echo '#' ; \
	 grep '^0x\([89].\|A0\)' < $< ; \
	 grep '^0x\(A[1-9A-F]\|[B-F][0-9A-F]\)\([4-9].\|A0\)' < $< ) \
	  | ./cjk_tab_to_h 'GBK extensions' gbkext_inv > $@
# CP936 extensions: GBKext.TXT lines matching ^0xA[1-9][B-F]., preceded by a
# lone '#' line.  $< is GBKext.TXT.
cp936ext.h: GBKext.TXT cjk_tab_to_h
	(echo '#' ; grep '^0xA[1-9][B-F].' < $< ) \
	  | ./cjk_tab_to_h 'CP936 extensions' cp936ext > $@
# GBKext.TXT: the CP936 mappings that are not already in GB2312.
# Prerequisites, in order: GB2312.TXT ($<) and CP936.TXT ($(word 2,$^)).
# Steps:
#   1. rewrite the leading hex digit of each byte of the GB2312 codes
#      (2..7 -> A..F) into $@.tmpEUCCN;
#   2. strip "#UNDEFINED" lines, comments and blank lines from that file;
#   3. strip the 0x.. (two-digit) lines, comments and blank lines from
#      CP936.TXT;
#   4. context-diff the two and keep only the added ("+ ") lines.
# The scratch files are named after the target instead of the fixed
# tmp1.TXT/tmp2.TXT, which the gb12345ext.h rule also writes: with fixed names
# the two recipes clobber each other's data under "make -j".
# NOTE(review): the "[ ]" bracket expressions are reproduced as they appear in
# this copy; confirm whether they were meant to hold a tab as well as a space.
GBKext.TXT : $(TABLESDIR)/unicode.org-mappings/EASTASIA/GB/GB2312.TXT $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP936.TXT
	sed -e 's,^0x2,0xA,' -e 's,^0x3,0xB,' -e 's,^0x4,0xC,' -e 's,^0x5,0xD,' -e 's,^0x6,0xE,' -e 's,^0x7,0xF,' \
	    -e 's,^0x\(..\)2,0x\1A,' -e 's,^0x\(..\)3,0x\1B,' -e 's,^0x\(..\)4,0x\1C,' -e 's,^0x\(..\)5,0x\1D,' -e 's,^0x\(..\)6,0x\1E,' -e 's,^0x\(..\)7,0x\1F,' \
	    $< > $@.tmpEUCCN ; \
	sed -e '/^0x..[ ]*#UNDEFINED/d' -e 's/#.*$$//' -e '/^[ ]*$$/d' $@.tmpEUCCN > $@.tmp1 ; \
	sed -e '/^0x..[ ]/d' -e 's/#.*$$//' -e '/^[ ]*$$/d' $(word 2,$^) > $@.tmp2 ; \
	diff -c1 $@.tmp1 $@.tmp2 | grep '^+ ' | sed -e 's,^+ ,,' > $@ \
	  && rm -f $@.tmpEUCCN $@.tmp1 $@.tmp2
# GB18030 two-byte extension: GB18030ext.TXT ($<) preceded by a lone '#' line,
# piped into cjk_tab_to_h.
gb18030ext.h: GB18030ext.TXT cjk_tab_to_h
	(echo '#' ; cat $< ) \
	  | ./cjk_tab_to_h 'GB18030 two-byte extension' gb18030ext > $@
# GB18030ext.TXT: the two-byte GB18030 mappings that are not in CP936.
# Prerequisites, in order: GB18030.TXT ($<) and CP936.TXT ($(word 2,$^)).
# CP936.TXT is stripped of comments and reduced to "0x<code> 0x...." lines in
# tmpGBK.TXT; that file is diffed against GB18030.TXT and only the
# "> 0x.... 0x...." lines are kept.
# NOTE(review): the "[ ]" bracket expression is reproduced as it appears in
# this copy; confirm whether it was meant to hold a tab as well as a space.
GB18030ext.TXT: $(TABLESDIR)/glibc-2.2.2-iconv/GB18030.TXT $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP936.TXT
	cat $(word 2,$^) | sed -e 's/[ ]*#.*$$//' | grep '^0x[0-9A-F]* 0x....$$' > tmpGBK.TXT ; \
	diff tmpGBK.TXT $< | grep '^> 0x.... 0x....$$' | sed -e 's/^> //' > $@ \
	  && rm -f tmpGBK.TXT
# GB18030 four-byte extension: cjk_tab_to_h reads GB18030uni.TXT ($<) on stdin
# and its stdout becomes the target.
gb18030uni.h: GB18030uni.TXT cjk_tab_to_h
	./cjk_tab_to_h 'GB18030 four-byte extension' gb18030uni < $< > $@
# GB18030uni.TXT: keep only the filled-GB18030.TXT lines that consist of an
# eight-hex-digit code followed by a four-character 0x.... value.
GB18030uni.TXT: $(TABLESDIR)/gb18030/filled-GB18030.TXT
	grep '^0x........ 0x....$$' < $< > $@
# CNS 11643 plane 1: keep comment lines and 0x1.... codes, drop the plane
# digit, and pipe into cjk_tab_to_h.
cns11643_1.h: $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
	grep '^\(#\|0x1\)' < $< | sed -e 's,^0x1,0x,' \
	  | ./cjk_tab_to_h 'CNS 11643-1992 plane 1' cns11643_1 > $@
# CNS 11643 plane 2: keep comment lines and 0x2.... codes, drop the plane
# digit, and pipe into cjk_tab_to_h.
cns11643_2.h: $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
	grep '^\(#\|0x2\)' < $< | sed -e 's,^0x2,0x,' \
	  | ./cjk_tab_to_h 'CNS 11643-1992 plane 2' cns11643_2 > $@
# CNS 11643 plane 3: keep comment lines and 0x3.... codes, drop the plane
# digit, and pipe into cjk_tab_to_h.
cns11643_3.h: $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
	grep '^\(#\|0x3\)' < $< | sed -e 's,^0x3,0x,' \
	  | ./cjk_tab_to_h 'CNS 11643-1992 plane 3' cns11643_3 > $@
# CNS 11643 plane 4, part a: keep comment lines and codes 0x40.. to 0x43..,
# drop the plane digit, and pipe into cjk_tab_to_h.
cns11643_4a.h: $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
	grep '^\(#\|0x4[0-3]\)' < $< | sed -e 's,^0x4,0x,' \
	  | ./cjk_tab_to_h 'CNS 11643-1992 plane 4 part a' cns11643_4a > $@
# CNS 11643 plane 4, part b: keep comment lines and codes 0x44.. to 0x47..,
# drop the plane digit, and pipe into cjk_tab_to_h.
cns11643_4b.h: $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
	grep '^\(#\|0x4[4-7]\)' < $< | sed -e 's,^0x4,0x,' \
	  | ./cjk_tab_to_h 'CNS 11643-1992 plane 4 part b' cns11643_4b > $@
# CNS 11643 plane 5: keep comment lines and 0x5.... codes, drop the plane
# digit, and pipe into cjk_tab_to_h.
cns11643_5.h: $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
	grep '^\(#\|0x5\)' < $< | sed -e 's,^0x5,0x,' \
	  | ./cjk_tab_to_h 'CNS 11643-1992 plane 5' cns11643_5 > $@
# CNS 11643 plane 6: keep comment lines and 0x6.... codes, drop the plane
# digit, and pipe into cjk_tab_to_h.
cns11643_6.h: $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
	grep '^\(#\|0x6\)' < $< | sed -e 's,^0x6,0x,' \
	  | ./cjk_tab_to_h 'CNS 11643-1992 plane 6' cns11643_6 > $@
# CNS 11643 plane 7: keep comment lines and 0x7.... codes, drop the plane
# digit, and pipe into cjk_tab_to_h.
cns11643_7.h: $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
	grep '^\(#\|0x7\)' < $< | sed -e 's,^0x7,0x,' \
	  | ./cjk_tab_to_h 'CNS 11643-1992 plane 7' cns11643_7 > $@
# CNS 11643 plane 15: keep comment lines and 0xF.... codes, drop the plane
# digit, and pipe into cjk_tab_to_h.
cns11643_15.h: $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
	grep '^\(#\|0xF\)' < $< | sed -e 's,^0xF,0x,' \
	  | ./cjk_tab_to_h 'CNS 11643-1992 plane 15' cns11643_15 > $@
# CNS 11643, all planes: the unfiltered table is fed to cjk_tab_to_h on stdin
# and its stdout becomes the target.
cns11643_inv.h: $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
	./cjk_tab_to_h 'CNS 11643-1992 planes 1-7, CNS 11643-1986 plane 15' cns11643_inv < $< > $@
# BIG5: cjk_tab_to_h reads the unicode.org table on stdin and its stdout
# becomes the target.
big5.h: $(TABLESDIR)/unicode.org-mappings/EASTASIA/OTHER/BIG5.TXT cjk_tab_to_h
	./cjk_tab_to_h BIG5 big5 < $< > $@
# CP950 extensions: CP950.TXT lines with codes 0xF9D6..0xF9FF, preceded by a
# lone '#' line, piped into cjk_tab_to_h.
cp950ext.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP950.TXT cjk_tab_to_h
	(echo '#' ; grep '^0xF9\(D[6-9A-F]\|[EF][0-9A-F]\)' < $< ) \
	  | ./cjk_tab_to_h 'CP950 extensions' cp950ext > $@
# HKSCS:1999: lines containing a comma are dropped from the table; the rest,
# preceded by a lone '#' line, is piped into cjk_tab_to_h.
hkscs1999.h: $(TABLESDIR)/big5hkscs/HKSCS-1999_2006.TXT cjk_tab_to_h
	(echo '#' ; grep -v , $<) \
	  | ./cjk_tab_to_h HKSCS:1999 hkscs1999 > $@
# HKSCS:2001: lines containing a comma are dropped from the delta table; the
# rest, preceded by a lone '#' line, is piped into cjk_tab_to_h.
hkscs2001.h: $(TABLESDIR)/big5hkscs/HKSCS-2001_2006-DELTA.TXT cjk_tab_to_h
	(echo '#' ; grep -v , $<) \
	  | ./cjk_tab_to_h HKSCS:2001 hkscs2001 > $@
# HKSCS:2004: lines containing a comma are dropped from the delta table; the
# rest, preceded by a lone '#' line, is piped into cjk_tab_to_h.
hkscs2004.h: $(TABLESDIR)/big5hkscs/HKSCS-2004_2006-DELTA.TXT cjk_tab_to_h
	(echo '#' ; grep -v , $<) \
	  | ./cjk_tab_to_h HKSCS:2004 hkscs2004 > $@
# HKSCS:2008: lines containing a comma are dropped from the delta table; the
# rest, preceded by a lone '#' line, is piped into cjk_tab_to_h.
hkscs2008.h: $(TABLESDIR)/big5hkscs/HKSCS-2008_2010-DELTA.TXT cjk_tab_to_h
	(echo '#' ; grep -v , $<) \
	  | ./cjk_tab_to_h HKSCS:2008 hkscs2008 > $@
# We use a modified KSC 5601 = KSX 1001 table: three mappings are appended to
# the unicode.org KSC5601.TXT before it is piped into cjk_tab_to_h.
# Jungshik Shin <jshin@mailaps.org> reports that Prof. GIM Geongseog
# (KIM Keyongseok) <gimgs@asadal.cs.pusan.ac.kr> (who represents South Korea in
# ISO/IEC JTC1 SC2/WG2 and SC22/WG20) says that two characters (0xA2E6 ->
# U+20AC and 0xA2E7 -> U+00AE below) were added to KSX 1001 in December 1998.
# According to http://std.dkuug.dk/jtc1/sc2/wg2/docs/N2815.doc, one more
# character (Korean postal code sign, 0xA2E8 -> U+327E below) was added in 2002.
ksc5601.h: $(TABLESDIR)/unicode.org-mappings/EASTASIA/KSC/KSC5601.TXT cjk_tab_to_h
	(cat $< ; echo '0xA2E6 0x20AC'; echo '0xA2E7 0x00AE'; echo '0xA2E8 0x327E') \
	  | ./cjk_tab_to_h 'KSC5601.1987-0, now KS X 1001:2002' ksc5601 > $@
# Unified Hangul Code part 1: table lines whose code starts with 0x8, 0x9 or
# 0xA0, preceded by a lone '#' line, piped into cjk_tab_to_h.
uhc_1.h: $(TABLESDIR)/unicode.org-mappings/EASTASIA/KSC/KSC5601.TXT cjk_tab_to_h
	(echo '#' ; grep '^0x\([8-9]\|A0\)' < $< ) \
	  | ./cjk_tab_to_h 'Unified Hangul Code part 1' uhc_1 > $@
# Unified Hangul Code part 2: table lines with first byte 0xA1..0xFF whose
# second byte starts with a digit 0-9 or is A0, preceded by a lone '#' line.
uhc_2.h: $(TABLESDIR)/unicode.org-mappings/EASTASIA/KSC/KSC5601.TXT cjk_tab_to_h
	(echo '#' ; grep '^0x\(A[1-9A-F]\|[B-F][0-9A-F]\)\([0-9]\|A0\)' < $< ) \
	  | ./cjk_tab_to_h 'Unified Hangul Code part 2' uhc_2 > $@
# JOHAB Hangul: JOHAB.TXT lines whose code matches [8-C]... or D[0-7]..,
# preceded by a lone '#' line, piped into cjk_tab_to_h.
johab_hangul.h: $(TABLESDIR)/unicode.org-mappings/EASTASIA/KSC/JOHAB.TXT cjk_tab_to_h
	(echo '#' ; grep '^0x\([8-C]...\|D[0-7]..\)' < $< ) \
	  | ./cjk_tab_to_h 'JOHAB Hangul' johab_hangul > $@
# CP856: feed the unicode.org VENDORS/MISC table to 8bit_tab_to_h on stdin.
cp856.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MISC/CP856.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP856 cp856 < $<
# CP922: a lone '#' line is emitted ahead of the aix-4.3.2 IBM-922 table
# before it is piped into 8bit_tab_to_h.
cp922.h: $(TABLESDIR)/aix-4.3.2/IBM-922.TXT 8bit_tab_to_h
	(echo '#' ; cat $<) | ./8bit_tab_to_h CP922 cp922
# CP1046: a lone '#' line is emitted ahead of the aix-4.3.2 IBM-1046 table
# before it is piped into 8bit_tab_to_h.
cp1046.h: $(TABLESDIR)/aix-4.3.2/IBM-1046.TXT 8bit_tab_to_h
	(echo '#' ; cat $<) | ./8bit_tab_to_h CP1046 cp1046
# CP1124: a lone '#' line is emitted ahead of the aix-4.3.2 IBM-1124 table
# before it is piped into 8bit_tab_to_h.
cp1124.h: $(TABLESDIR)/aix-4.3.2/IBM-1124.TXT 8bit_tab_to_h
	(echo '#' ; cat $<) | ./8bit_tab_to_h CP1124 cp1124
# CP1129: a lone '#' line is emitted ahead of the aix-4.3.2 IBM-1129 table
# before it is piped into 8bit_tab_to_h.
cp1129.h: $(TABLESDIR)/aix-4.3.2/IBM-1129.TXT 8bit_tab_to_h
	(echo '#' ; cat $<) | ./8bit_tab_to_h CP1129 cp1129
# CP1161: the input is a lone '#' line, then ASCII.TXT, then the IBM1161 table
# with every line starting 0x0..0x7 removed; all of it is piped into
# 8bit_tab_to_h.
# Prerequisites, in order: IBM1161.TXT ($<), ASCII.TXT ($(word 2,$^)), and the
# tool.  ASCII.TXT and 8bit_tab_to_h are declared because the recipe reads
# and executes them.  With ASCII.TXT declared, a missing file stops make
# instead of "cat" failing inside the pipeline, where its exit status is lost.
# NOTE(review): ASCII.TXT is taken from glibc-2.2-iconv here, while the
# ascii.h rule reads it from glibc-2.1-iconv -- confirm this directory is
# intended.
cp1161.h : $(TABLESDIR)/glibc-2.2.90-iconv/IBM1161.TXT $(TABLESDIR)/glibc-2.2-iconv/ASCII.TXT 8bit_tab_to_h
	(echo '#' ; cat $(word 2,$^) ; grep -v '^0x[0-7]' $<) | ./8bit_tab_to_h CP1161 cp1161
# CP1162: a lone '#' line is emitted ahead of the glibc-2.2.90-iconv IBM1162
# table before it is piped into 8bit_tab_to_h.
# 8bit_tab_to_h is listed as a prerequisite because the recipe executes it;
# without it the tool may be missing or stale when this rule runs.  It is
# placed last so that $< still names the table file.
cp1162.h : $(TABLESDIR)/glibc-2.2.90-iconv/IBM1162.TXT 8bit_tab_to_h
	(echo '#' ; cat $<) | ./8bit_tab_to_h CP1162 cp1162
# CP1163: a lone '#' line is emitted ahead of the glibc-2.2.90-iconv IBM1163
# table before it is piped into 8bit_tab_to_h.
# 8bit_tab_to_h is listed as a prerequisite because the recipe executes it;
# without it the tool may be missing or stale when this rule runs.  It is
# placed last so that $< still names the table file.
cp1163.h : $(TABLESDIR)/glibc-2.2.90-iconv/IBM1163.TXT 8bit_tab_to_h
	(echo '#' ; cat $<) | ./8bit_tab_to_h CP1163 cp1163
# CP437: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp437.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP437.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP437 cp437 < $<
# CP737: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp737.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP737.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP737 cp737 < $<
# CP775: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp775.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP775.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP775 cp775 < $<
# CP852: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp852.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP852.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP852 cp852 < $<
# CP853: a lone '#' line is emitted ahead of the "other" CP853 table before it
# is piped into 8bit_tab_to_h.
cp853.h: $(TABLESDIR)/other/CP853.TXT 8bit_tab_to_h
	(echo '#'; cat $<) | ./8bit_tab_to_h CP853 cp853
# CP855: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp855.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP855.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP855 cp855 < $<
# CP857: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp857.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP857.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP857 cp857 < $<
# CP858: a lone '#' line is emitted ahead of the windows-2000 CP858 table
# before it is piped into 8bit_tab_to_h.
cp858.h: $(TABLESDIR)/windows-2000/CP858.TXT 8bit_tab_to_h
	(echo '#' ; cat $<) | ./8bit_tab_to_h CP858 cp858
# CP860: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp860.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP860.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP860 cp860 < $<
# CP861: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp861.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP861.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP861 cp861 < $<
# CP863: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp863.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP863.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP863 cp863 < $<
# CP864: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp864.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP864.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP864 cp864 < $<
# CP865: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp865.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP865.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP865 cp865 < $<
# CP869: feed the Microsoft PC table to 8bit_tab_to_h on stdin.
cp869.h: $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP869.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP869 cp869 < $<
# CP1125: feed the csets-new table to 8bit_tab_to_h on stdin.
cp1125.h: $(TABLESDIR)/csets-new/CP1125.TXT 8bit_tab_to_h
	./8bit_tab_to_h CP1125 cp1125 < $<
# JISX0213:2004: cjk_tab_to_h reads the local JISX0213.TXT on stdin and its
# stdout becomes the target.
jisx0213.h: JISX0213.TXT cjk_tab_to_h
	./cjk_tab_to_h JISX0213:2004 jisx0213 < $< > $@
# TDS565: a lone '#' line is emitted ahead of the recode-cvs table before it is
# piped into 8bit_tab_to_h; unlike most 8-bit rules, stdout is redirected to
# the target here.
tds565.h: $(TABLESDIR)/recode-cvs/TDS565.TXT 8bit_tab_to_h
	(echo '#'; cat $<) | ./8bit_tab_to_h TDS565 tds565 > $@
# Atari ST: 8bit_tab_to_h reads the unicode.org VENDORS/MISC table on stdin;
# stdout is redirected to the target.
# 8bit_tab_to_h is listed as a prerequisite because the recipe executes it;
# without it the tool may be missing or stale when this rule runs.  It is
# placed last so that $< still names the table file.
atarist.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MISC/ATARIST.TXT 8bit_tab_to_h
	./8bit_tab_to_h 'Atari ST' atarist < $< > $@
# RISCOS-LATIN1: a lone '#' line is emitted ahead of the recode-cvs table
# before it is piped into 8bit_tab_to_h; stdout is redirected to the target.
riscos1.h: $(TABLESDIR)/recode-cvs/RISCOS-LATIN1.TXT 8bit_tab_to_h
	(echo '#'; cat $<) | ./8bit_tab_to_h RISCOS-LATIN1 riscos1 > $@
# cjk_variants.h: the cjk_variants tool reads the yasuoka UniVariants file on
# stdin and its stdout becomes the target.
cjk_variants.h: $(TABLESDIR)/yasuoka/UniVariants cjk_variants
	./cjk_variants < $< > $@
# Helper programs used by the table rules.  Each one is compiled from the
# single C source of the same name, with identical flags, so the three rules
# are expressed as one static pattern rule: for each listed target, $< is
# <target>.c and $@ is the target.
8bit_tab_to_h cjk_tab_to_h cjk_variants: %: %.c
	gcc -O -Wall -g $< -o $@
533 rm -f
8bit_tab_to_h cjk_tab_to_h cjk_variants
$(ALL
) GBKext.TXT