4 * The Regents of the University of California. All rights reserved.
6 * This code is derived from software contributed to Berkeley by
7 * Paul Borman at Krystal Technologies.
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
17 * 3. All advertising materials mentioning features or use of this software
18 * must display the following acknowledgement:
19 * This product includes software developed by the University of
20 * California, Berkeley and its contributors.
21 * 4. Neither the name of the University nor the names of its contributors
22 * may be used to endorse or promote products derived from this software
23 * without specific prior written permission.
25 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
26 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
27 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
28 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
29 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
30 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
31 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
32 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
33 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
34 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
40 static char sccsid
[] = "@(#)yacc.y 8.1 (Berkeley) 6/6/93";
44 #include <sys/cdefs.h>
45 __FBSDID
("$FreeBSD$");
47 #include <arpa/inet.h>
61 static void *xmalloc
(unsigned int sz
);
62 static uint32_t *xlalloc
(unsigned int sz
);
63 void yyerror(const char *s
);
64 static uint32_t *xrelalloc
(uint32_t *old
, unsigned int sz
);
65 static void dump_tables
(void);
66 static void cleanout
(void);
68 const char *locale_file
= "<stdout>";
70 rune_map maplower
= { { 0 }, NULL
};
71 rune_map mapupper
= { { 0 }, NULL
};
72 rune_map types
= { { 0 }, NULL
};
74 _FileRuneLocale new_locale
= { "", "", {}, {}, {}, 0, 0, 0, 0 };
75 char *variable
= NULL
;
77 void set_map
(rune_map
*, rune_list
*, uint32_t);
78 void set_digitmap
(rune_map
*, rune_list
*);
79 void add_map
(rune_map
*, rune_list
*, uint32_t);
80 static void usage
(void);
119 entry
: ENCODING STRING
120 { if
(strcmp
($2, "NONE") &&
121 strcmp
($2, "ASCII") &&
122 strcmp
($2, "UTF-8") &&
125 strcmp
($2, "GB18030") &&
126 strcmp
($2, "GB2312") &&
127 strcmp
($2, "BIG5") &&
128 strcmp
($2, "MSKanji"))
129 warnx
("ENCODING %s is not supported by libc", $2);
130 strncpy
(new_locale.encoding
, $2,
131 sizeof
(new_locale.encoding
)); }
133 { new_locale.variable_len
= strlen
($1) + 1;
134 variable
= xmalloc
(new_locale.variable_len
);
135 strcpy
(variable
, $1);
138 { warnx
("the INVALID keyword is deprecated"); }
140 { set_map
(&types
, $2, $1); }
142 { set_map
(&maplower
, $2, 0); }
144 { set_map
(&mapupper
, $2, 0); }
146 { set_digitmap
(&types
, $2); }
151 $$
= (rune_list
*)xmalloc
(sizeof
(rune_list
));
158 $$
= (rune_list
*)xmalloc
(sizeof
(rune_list
));
165 $$
= (rune_list
*)xmalloc
(sizeof
(rune_list
));
170 | list RUNE THRU RUNE
172 $$
= (rune_list
*)xmalloc
(sizeof
(rune_list
));
179 map
: LBRK RUNE RUNE RBRK
181 $$
= (rune_list
*)xmalloc
(sizeof
(rune_list
));
187 | map LBRK RUNE RUNE RBRK
189 $$
= (rune_list
*)xmalloc
(sizeof
(rune_list
));
195 | LBRK RUNE THRU RUNE
':' RUNE RBRK
197 $$
= (rune_list
*)xmalloc
(sizeof
(rune_list
));
203 | map LBRK RUNE THRU RUNE
':' RUNE RBRK
205 $$
= (rune_list
*)xmalloc
(sizeof
(rune_list
));
225 main
(int ac
, char *av
[])
231 while
((x
= getopt
(ac
, av
, "do:")) != -1) {
237 locale_file
= optarg
;
238 if
((fp
= fopen
(locale_file
, "w")) == NULL
)
239 err
(1, "%s", locale_file
);
247 switch
(ac
- optind
) {
251 if
(freopen
(av
[optind
], "r", stdin
) == 0)
252 err
(1, "%s", av
[optind
]);
257 for
(x
= 0; x
< _CACHED_RUNES
; ++x
) {
261 memcpy
(new_locale.magic
, _FILE_RUNE_MAGIC_1
, sizeof
(new_locale.magic
));
271 fprintf
(stderr
, "usage: mklocale [-d] [-o output] [source]\n");
279 fprintf
(stderr
, "%s\n", s
);
286 void *r
= malloc
(sz
);
296 uint32_t *r
= (uint32_t *)malloc
(sz
* sizeof
(uint32_t));
307 uint32_t *r
= (uint32_t *)realloc
((char *)old
,
308 sz
* sizeof
(uint32_t));
310 errx
(1, "xrelalloc");
315 set_map
(map
, list
, flag
)
321 rune_list
*nlist
= list
->next
;
322 add_map
(map
, list
, flag
);
328 set_digitmap
(map
, list
)
335 rune_list
*nlist
= list
->next
;
336 for
(i
= list
->min
; i
<= list
->max
; ++i
) {
337 if
(list
->map
+ (i
- list
->min
)) {
338 rune_list
*tmp
= (rune_list
*)xmalloc
(sizeof
(rune_list
));
341 add_map
(map
, tmp
, list
->map
+ (i
- list
->min
));
350 add_map
(map
, list
, flag
)
360 while
(list
->min
< _CACHED_RUNES
&& list
->min
<= list
->max
) {
362 map
->map
[list
->min
++] |
= flag
;
364 map
->map
[list
->min
++] = list
->map
++;
367 if
(list
->min
> list
->max
) {
372 run
= list
->max
- list
->min
+ 1;
374 if
(!(r
= map
->root
) ||
(list
->max
< r
->min
- 1)
375 ||
(!flag
&& list
->max
== r
->min
- 1)) {
377 list
->types
= xlalloc
(run
);
378 for
(i
= 0; i
< run
; ++i
)
379 list
->types
[i
] = flag
;
381 list
->next
= map
->root
;
386 for
(r
= map
->root
; r
&& r
->max
+ 1 < list
->min
; r
= r
->next
)
391 * We are off the end.
394 list
->types
= xlalloc
(run
);
395 for
(i
= 0; i
< run
; ++i
)
396 list
->types
[i
] = flag
;
403 if
(list
->max
< r
->min
- 1) {
405 * We come before this range and we do not intersect it.
406 * We are not before the root node, it was checked before the loop
409 list
->types
= xlalloc
(run
);
410 for
(i
= 0; i
< run
; ++i
)
411 list
->types
[i
] = flag
;
413 list
->next
= lr
->next
;
419 * At this point we have found that we at least intersect with
420 * the range pointed to by `r', we might intersect with one or
421 * more ranges beyond `r' as well.
424 if
(!flag
&& list
->map
- list
->min
!= r
->map
- r
->min
) {
426 * There are only two cases when we are doing case maps and
427 * our maps needn't have the same offset. When we are adjoining
428 * but not intersecting.
430 if
(list
->max
+ 1 == r
->min
) {
435 if
(list
->min
- 1 == r
->max
) {
436 list
->next
= r
->next
;
440 errx
(1, "error: conflicting map entries");
443 if
(list
->min
>= r
->min
&& list
->max
<= r
->max
) {
449 for
(i
= list
->min
; i
<= list
->max
; ++i
)
450 r
->types
[i
- r
->min
] |
= flag
;
455 if
(list
->min
<= r
->min
&& list
->max
>= r
->max
) {
457 * Superset case. Make him big enough to hold us.
458 * We might need to merge with the guy after him.
461 list
->types
= xlalloc
(list
->max
- list
->min
+ 1);
463 for
(i
= list
->min
; i
<= list
->max
; ++i
)
464 list
->types
[i
- list
->min
] = flag
;
466 for
(i
= r
->min
; i
<= r
->max
; ++i
)
467 list
->types
[i
- list
->min
] |
= r
->types
[i
- r
->min
];
470 r
->types
= list
->types
;
477 } else if
(list
->min
< r
->min
) {
479 * Our tail intersects his head.
482 list
->types
= xlalloc
(r
->max
- list
->min
+ 1);
484 for
(i
= r
->min
; i
<= r
->max
; ++i
)
485 list
->types
[i
- list
->min
] = r
->types
[i
- r
->min
];
487 for
(i
= list
->min
; i
< r
->min
; ++i
)
488 list
->types
[i
- list
->min
] = flag
;
490 for
(i
= r
->min
; i
<= list
->max
; ++i
)
491 list
->types
[i
- list
->min
] |
= flag
;
494 r
->types
= list
->types
;
503 * Our head intersects his tail.
504 * We might need to merge with the guy after him.
507 r
->types
= xrelalloc
(r
->types
, list
->max
- r
->min
+ 1);
509 for
(i
= list
->min
; i
<= r
->max
; ++i
)
510 r
->types
[i
- r
->min
] |
= flag
;
512 for
(i
= r
->max
+1; i
<= list
->max
; ++i
)
513 r
->types
[i
- r
->min
] = flag
;
520 * Okay, check to see if we grew into the next guy(s)
522 while
((lr
= r
->next
) && r
->max
>= lr
->min
) {
524 if
(r
->max
>= lr
->max
) {
526 * Good, we consumed all of him.
528 for
(i
= lr
->min
; i
<= lr
->max
; ++i
)
529 r
->types
[i
- r
->min
] |
= lr
->types
[i
- lr
->min
];
532 * "append" him on to the end of us.
534 r
->types
= xrelalloc
(r
->types
, lr
->max
- r
->min
+ 1);
536 for
(i
= lr
->min
; i
<= r
->max
; ++i
)
537 r
->types
[i
- r
->min
] |
= lr
->types
[i
- lr
->min
];
539 for
(i
= r
->max
+1; i
<= lr
->max
; ++i
)
540 r
->types
[i
- r
->min
] = lr
->types
[i
- lr
->min
];
545 if
(lr
->max
> r
->max
)
560 int x
, first_d
, curr_d
;
564 * See if we can compress some of the istype arrays
566 for
(list
= types.root
; list
; list
= list
->next
) {
567 list
->map
= list
->types
[0];
568 for
(x
= 1; x
< list
->max
- list
->min
+ 1; ++x
) {
569 if
((int32_t)list
->types
[x
] != list
->map
) {
576 first_d
= curr_d
= -1;
577 for
(x
= 0; x
< _CACHED_RUNES
; ++x
) {
578 uint32_t r
= types.map
[x
];
582 first_d
= curr_d
= x
;
583 else if
(x
!= curr_d
+ 1)
584 errx
(1, "error: DIGIT range is not contiguous");
585 else if
(x
- first_d
> 9)
586 errx
(1, "error: DIGIT range is too big");
591 "error: DIGIT range is not a subset of XDIGIT range");
595 errx
(1, "error: no DIGIT range defined in the single byte area");
596 else if
(curr_d
- first_d
< 9)
597 errx
(1, "error: DIGIT range is too small in the single byte area");
600 * Fill in our tables. Do this in network order so that
601 * diverse machines have a chance of sharing data.
602 * (Machines like Crays cannot share with little machines due to
603 * word size. Sigh. We tried.)
605 for
(x
= 0; x
< _CACHED_RUNES
; ++x
) {
606 new_locale.runetype
[x
] = htonl
(types.map
[x
]);
607 new_locale.maplower
[x
] = htonl
(maplower.map
[x
]);
608 new_locale.mapupper
[x
] = htonl
(mapupper.map
[x
]);
612 * Count up how many ranges we will need for each of the extents.
617 new_locale.runetype_ext_nranges
++;
620 new_locale.runetype_ext_nranges
=
621 htonl
(new_locale.runetype_ext_nranges
);
623 list
= maplower.root
;
626 new_locale.maplower_ext_nranges
++;
629 new_locale.maplower_ext_nranges
=
630 htonl
(new_locale.maplower_ext_nranges
);
632 list
= mapupper.root
;
635 new_locale.mapupper_ext_nranges
++;
638 new_locale.mapupper_ext_nranges
=
639 htonl
(new_locale.mapupper_ext_nranges
);
641 new_locale.variable_len
= htonl
(new_locale.variable_len
);
644 * Okay, we are now ready to write the new locale file.
648 * PART 1: The _FileRuneLocale structure
650 if
(fwrite
((char *)&new_locale
, sizeof
(new_locale
), 1, fp
) != 1) {
655 * PART 2: The runetype_ext structures (not the actual tables)
662 re.min
= htonl
(list
->min
);
663 re.max
= htonl
(list
->max
);
664 re.map
= htonl
(list
->map
);
666 if
(fwrite
((char *)&re
, sizeof
(re
), 1, fp
) != 1) {
674 * PART 3: The maplower_ext structures
676 list
= maplower.root
;
681 re.min
= htonl
(list
->min
);
682 re.max
= htonl
(list
->max
);
683 re.map
= htonl
(list
->map
);
685 if
(fwrite
((char *)&re
, sizeof
(re
), 1, fp
) != 1) {
693 * PART 4: The mapupper_ext structures
695 list
= mapupper.root
;
700 re.min
= htonl
(list
->min
);
701 re.max
= htonl
(list
->max
);
702 re.map
= htonl
(list
->map
);
704 if
(fwrite
((char *)&re
, sizeof
(re
), 1, fp
) != 1) {
712 * PART 5: The runetype_ext tables
717 for
(x
= 0; x
< list
->max
- list
->min
+ 1; ++x
)
718 list
->types
[x
] = htonl
(list
->types
[x
]);
721 if
(fwrite
((char *)list
->types
,
722 (list
->max
- list
->min
+ 1) * sizeof
(uint32_t),
731 * PART 6: And finally the variable data
734 ntohl
(new_locale.variable_len
), 1, fp
) != 1) {
738 if
(fclose
(fp
) != 0) {
747 if
(new_locale.encoding
[0])
748 fprintf
(stderr
, "ENCODING %s\n", new_locale.encoding
);
750 fprintf
(stderr
, "VARIABLE %s\n", variable
);
752 fprintf
(stderr
, "\nMAPLOWER:\n\n");
754 for
(x
= 0; x
< _CACHED_RUNES
; ++x
) {
755 if
(isprint
(maplower.map
[x
]))
756 fprintf
(stderr
, " '%c'", (int)maplower.map
[x
]);
757 else if
(maplower.map
[x
])
758 fprintf
(stderr
, "%04x", maplower.map
[x
]);
760 fprintf
(stderr
, "%4x", 0);
761 if
((x
& 0xf) == 0xf)
762 fprintf
(stderr
, "\n");
764 fprintf
(stderr
, " ");
766 fprintf
(stderr
, "\n");
768 for
(list
= maplower.root
; list
; list
= list
->next
)
769 fprintf
(stderr
, "\t%04x - %04x : %04x\n", list
->min
, list
->max
, list
->map
);
771 fprintf
(stderr
, "\nMAPUPPER:\n\n");
773 for
(x
= 0; x
< _CACHED_RUNES
; ++x
) {
774 if
(isprint
(mapupper.map
[x
]))
775 fprintf
(stderr
, " '%c'", (int)mapupper.map
[x
]);
776 else if
(mapupper.map
[x
])
777 fprintf
(stderr
, "%04x", mapupper.map
[x
]);
779 fprintf
(stderr
, "%4x", 0);
780 if
((x
& 0xf) == 0xf)
781 fprintf
(stderr
, "\n");
783 fprintf
(stderr
, " ");
785 fprintf
(stderr
, "\n");
787 for
(list
= mapupper.root
; list
; list
= list
->next
)
788 fprintf
(stderr
, "\t%04x - %04x : %04x\n", list
->min
, list
->max
, list
->map
);
791 fprintf
(stderr
, "\nTYPES:\n\n");
793 for
(x
= 0; x
< _CACHED_RUNES
; ++x
) {
794 uint32_t r
= types.map
[x
];
798 fprintf
(stderr
, " '%c': %2d", x
, (int)(r
& 0xff));
800 fprintf
(stderr
, "%04x: %2d", x
, (int)(r
& 0xff));
802 fprintf
(stderr
, " %4s", (r
& _CTYPE_A
) ?
"alph" : "");
803 fprintf
(stderr
, " %4s", (r
& _CTYPE_C
) ?
"ctrl" : "");
804 fprintf
(stderr
, " %4s", (r
& _CTYPE_D
) ?
"dig" : "");
805 fprintf
(stderr
, " %4s", (r
& _CTYPE_G
) ?
"graf" : "");
806 fprintf
(stderr
, " %4s", (r
& _CTYPE_L
) ?
"low" : "");
807 fprintf
(stderr
, " %4s", (r
& _CTYPE_P
) ?
"punc" : "");
808 fprintf
(stderr
, " %4s", (r
& _CTYPE_S
) ?
"spac" : "");
809 fprintf
(stderr
, " %4s", (r
& _CTYPE_U
) ?
"upp" : "");
810 fprintf
(stderr
, " %4s", (r
& _CTYPE_X
) ?
"xdig" : "");
811 fprintf
(stderr
, " %4s", (r
& _CTYPE_B
) ?
"blnk" : "");
812 fprintf
(stderr
, " %4s", (r
& _CTYPE_R
) ?
"prnt" : "");
813 fprintf
(stderr
, " %4s", (r
& _CTYPE_I
) ?
"ideo" : "");
814 fprintf
(stderr
, " %4s", (r
& _CTYPE_T
) ?
"spec" : "");
815 fprintf
(stderr
, " %4s", (r
& _CTYPE_Q
) ?
"phon" : "");
816 fprintf
(stderr
, "\n");
820 for
(list
= types.root
; list
; list
= list
->next
) {
821 if
(list
->map
&& list
->min
+ 3 < list
->max
) {
822 uint32_t r
= list
->map
;
824 fprintf
(stderr
, "%04x: %2d",
825 (uint32_t)list
->min
, (int)(r
& 0xff));
827 fprintf
(stderr
, " %4s", (r
& _CTYPE_A
) ?
"alph" : "");
828 fprintf
(stderr
, " %4s", (r
& _CTYPE_C
) ?
"ctrl" : "");
829 fprintf
(stderr
, " %4s", (r
& _CTYPE_D
) ?
"dig" : "");
830 fprintf
(stderr
, " %4s", (r
& _CTYPE_G
) ?
"graf" : "");
831 fprintf
(stderr
, " %4s", (r
& _CTYPE_L
) ?
"low" : "");
832 fprintf
(stderr
, " %4s", (r
& _CTYPE_P
) ?
"punc" : "");
833 fprintf
(stderr
, " %4s", (r
& _CTYPE_S
) ?
"spac" : "");
834 fprintf
(stderr
, " %4s", (r
& _CTYPE_U
) ?
"upp" : "");
835 fprintf
(stderr
, " %4s", (r
& _CTYPE_X
) ?
"xdig" : "");
836 fprintf
(stderr
, " %4s", (r
& _CTYPE_B
) ?
"blnk" : "");
837 fprintf
(stderr
, " %4s", (r
& _CTYPE_R
) ?
"prnt" : "");
838 fprintf
(stderr
, " %4s", (r
& _CTYPE_I
) ?
"ideo" : "");
839 fprintf
(stderr
, " %4s", (r
& _CTYPE_T
) ?
"spec" : "");
840 fprintf
(stderr
, " %4s", (r
& _CTYPE_Q
) ?
"phon" : "");
841 fprintf
(stderr
, "\n...\n");
843 fprintf
(stderr
, "%04x: %2d",
844 (uint32_t)list
->max
, (int)(r
& 0xff));
846 fprintf
(stderr
, " %4s", (r
& _CTYPE_A
) ?
"alph" : "");
847 fprintf
(stderr
, " %4s", (r
& _CTYPE_C
) ?
"ctrl" : "");
848 fprintf
(stderr
, " %4s", (r
& _CTYPE_D
) ?
"dig" : "");
849 fprintf
(stderr
, " %4s", (r
& _CTYPE_G
) ?
"graf" : "");
850 fprintf
(stderr
, " %4s", (r
& _CTYPE_L
) ?
"low" : "");
851 fprintf
(stderr
, " %4s", (r
& _CTYPE_P
) ?
"punc" : "");
852 fprintf
(stderr
, " %4s", (r
& _CTYPE_S
) ?
"spac" : "");
853 fprintf
(stderr
, " %4s", (r
& _CTYPE_U
) ?
"upp" : "");
854 fprintf
(stderr
, " %4s", (r
& _CTYPE_X
) ?
"xdig" : "");
855 fprintf
(stderr
, " %4s", (r
& _CTYPE_B
) ?
"blnk" : "");
856 fprintf
(stderr
, " %4s", (r
& _CTYPE_R
) ?
"prnt" : "");
857 fprintf
(stderr
, " %4s", (r
& _CTYPE_I
) ?
"ideo" : "");
858 fprintf
(stderr
, " %4s", (r
& _CTYPE_T
) ?
"spec" : "");
859 fprintf
(stderr
, " %4s", (r
& _CTYPE_Q
) ?
"phon" : "");
860 fprintf
(stderr
, "\n");
862 for
(x
= list
->min
; x
<= list
->max
; ++x
) {
863 uint32_t r
= ntohl
(list
->types
[x
- list
->min
]);
866 fprintf
(stderr
, "%04x: %2d", x
, (int)(r
& 0xff));
868 fprintf
(stderr
, " %4s", (r
& _CTYPE_A
) ?
"alph" : "");
869 fprintf
(stderr
, " %4s", (r
& _CTYPE_C
) ?
"ctrl" : "");
870 fprintf
(stderr
, " %4s", (r
& _CTYPE_D
) ?
"dig" : "");
871 fprintf
(stderr
, " %4s", (r
& _CTYPE_G
) ?
"graf" : "");
872 fprintf
(stderr
, " %4s", (r
& _CTYPE_L
) ?
"low" : "");
873 fprintf
(stderr
, " %4s", (r
& _CTYPE_P
) ?
"punc" : "");
874 fprintf
(stderr
, " %4s", (r
& _CTYPE_S
) ?
"spac" : "");
875 fprintf
(stderr
, " %4s", (r
& _CTYPE_U
) ?
"upp" : "");
876 fprintf
(stderr
, " %4s", (r
& _CTYPE_X
) ?
"xdig" : "");
877 fprintf
(stderr
, " %4s", (r
& _CTYPE_B
) ?
"blnk" : "");
878 fprintf
(stderr
, " %4s", (r
& _CTYPE_R
) ?
"prnt" : "");
879 fprintf
(stderr
, " %4s", (r
& _CTYPE_I
) ?
"ideo" : "");
880 fprintf
(stderr
, " %4s", (r
& _CTYPE_T
) ?
"spec" : "");
881 fprintf
(stderr
, " %4s", (r
& _CTYPE_Q
) ?
"phon" : "");
882 fprintf
(stderr
, "\n");