4 Copyright (C) 2007-2024
5 Free Software Foundation, Inc.
10 This file is part of the Midnight Commander.
12 The Midnight Commander is free software: you can redistribute it
13 and/or modify it under the terms of the GNU General Public License as
14 published by the Free Software Foundation, either version 3 of the License,
15 or (at your option) any later version.
17 The Midnight Commander is distributed in the hope that it will be useful,
18 but WITHOUT ANY WARRANTY; without even the implied warranty of
19 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
20 GNU General Public License for more details.
22 You should have received a copy of the GNU General Public License
23 along with this program. If not, see <http://www.gnu.org/licenses/>.
31 #include "lib/global.h"
32 #include "lib/strutil.h"
34 /* Functions for single-byte encodings, all characters have width 1
35 * using standard system functions.
36 * There are only small differences between functions in strutil8bit.c
40 /*** global variables ****************************************************************************/
42 /*** file scope macro definitions ****************************************************************/
45 * Inlines to equalize 'char' signedness for single 'char' encodings.
47 * isspace ((unsigned char) c);
/* Generates a static inline wrapper char_<func_name> (char c) around the
 * ctype-style function func_name.  The argument is converted to
 * unsigned char before it is widened to int, so the wrapped function sees
 * the same non-negative value whether plain 'char' is signed or unsigned. */
51 #define DECLARE_CTYPE_WRAPPER(func_name) \
52 static inline int char_##func_name(char c) \
54 return func_name((int)(unsigned char)c); \
57 /*** file scope type declarations ****************************************************************/
59 /*** forward declarations (file scope functions) *************************************************/
61 /*** file scope variables ************************************************************************/
/* Replacement character; appended to a GString by
 * str_8bit_insert_replace_char (). */
63 static const char replch
= '?';
65 /* --------------------------------------------------------------------------------------------- */
66 /*** file scope functions ************************************************************************/
67 /* --------------------------------------------------------------------------------------------- */
/* Instantiate the wrappers char_isalnum (), char_isdigit (), char_isprint (),
 * char_ispunct (), char_isspace (), char_toupper () and char_tolower ();
 * each one takes a plain 'char' and forwards it as an unsigned char value. */
70 DECLARE_CTYPE_WRAPPER (isalnum
)
71 DECLARE_CTYPE_WRAPPER (isdigit
)
72 DECLARE_CTYPE_WRAPPER (isprint
)
73 DECLARE_CTYPE_WRAPPER (ispunct
)
74 DECLARE_CTYPE_WRAPPER (isspace
)
75 DECLARE_CTYPE_WRAPPER (toupper
)
76 DECLARE_CTYPE_WRAPPER (tolower
)
79 /* --------------------------------------------------------------------------------------------- */
/* Appends the replacement character replch to buffer. */
82 str_8bit_insert_replace_char (GString
*buffer
)
84 g_string_append_c (buffer
, replch
);
87 /* --------------------------------------------------------------------------------------------- */
90 str_8bit_is_valid_string (const char *text
)
96 /* --------------------------------------------------------------------------------------------- */
99 str_8bit_is_valid_char (const char *ch
, size_t size
)
106 /* --------------------------------------------------------------------------------------------- */
109 str_8bit_cnext_char (const char **text
)
114 /* --------------------------------------------------------------------------------------------- */
117 str_8bit_cprev_char (const char **text
)
122 /* --------------------------------------------------------------------------------------------- */
125 str_8bit_cnext_noncomb_char (const char **text
)
127 if (*text
[0] == '\0')
134 /* --------------------------------------------------------------------------------------------- */
137 str_8bit_cprev_noncomb_char (const char **text
, const char *begin
)
139 if ((*text
) == begin
)
146 /* --------------------------------------------------------------------------------------------- */
/* Tests the first byte of text with char_isspace ().  The "!= 0" collapses
 * the ctype result to exactly 0 or 1. */
149 str_8bit_isspace (const char *text
)
151 return char_isspace (text
[0]) != 0;
154 /* --------------------------------------------------------------------------------------------- */
/* Tests the first byte of text with char_ispunct ().  The "!= 0" collapses
 * the ctype result to exactly 0 or 1. */
157 str_8bit_ispunct (const char *text
)
159 return char_ispunct (text
[0]) != 0;
162 /* --------------------------------------------------------------------------------------------- */
/* Tests the first byte of text with char_isalnum ().  The "!= 0" collapses
 * the ctype result to exactly 0 or 1. */
165 str_8bit_isalnum (const char *text
)
167 return char_isalnum (text
[0]) != 0;
170 /* --------------------------------------------------------------------------------------------- */
/* Tests the first byte of text with char_isdigit ().  The "!= 0" collapses
 * the ctype result to exactly 0 or 1. */
173 str_8bit_isdigit (const char *text
)
175 return char_isdigit (text
[0]) != 0;
178 /* --------------------------------------------------------------------------------------------- */
/* Tests the first byte of text with char_isprint ().  The "!= 0" collapses
 * the ctype result to exactly 0 or 1. */
181 str_8bit_isprint (const char *text
)
183 return char_isprint (text
[0]) != 0;
186 /* --------------------------------------------------------------------------------------------- */
189 str_8bit_iscombiningmark (const char *text
)
195 /* --------------------------------------------------------------------------------------------- */
/* Stores the upper-case form (char_toupper ()) of the first byte of text
 * at the current output position (*out)[0]. */
198 str_8bit_toupper (const char *text
, char **out
, size_t *remain
)
203 (*out
)[0] = char_toupper (text
[0]);
209 /* --------------------------------------------------------------------------------------------- */
/* Stores the lower-case form (char_tolower ()) of the first byte of text
 * at the current output position (*out)[0]. */
212 str_8bit_tolower (const char *text
, char **out
, size_t *remain
)
217 (*out
)[0] = char_tolower (text
[0]);
223 /* --------------------------------------------------------------------------------------------- */
/* Length of text, taken directly from strlen (). */
226 str_8bit_length (const char *text
)
228 return strlen (text
);
231 /* --------------------------------------------------------------------------------------------- */
/* Length of text limited by size: returns strlen (text) capped at size when
 * size >= 0; a negative size means "no limit" and the full length is
 * returned. */
234 str_8bit_length2 (const char *text
, int size
)
238 length
= strlen (text
);
240 return (size
>= 0) ? MIN (length
, (size_t) size
) : length
;
243 /* --------------------------------------------------------------------------------------------- */
/* Converts mcerror->message from UTF-8 with a converter obtained from
 * str_crt_conv_from ().
 *
 * ret is a copy of def_msg (or of "" when def_msg is NULL) if the converter
 * cannot be created (INVALID_CONV) or str_convert () reports ESTR_FAILURE.
 * Otherwise ret takes over the character data of buf via
 * g_string_free (buf, FALSE).  Every visible assignment to ret yields a
 * newly allocated string.  The converter is closed with str_close_conv ()
 * once it has been used. */
246 str_8bit_conv_gerror_message (GError
*mcerror
, const char *def_msg
)
251 /* glib messages are in UTF-8 charset */
252 conv
= str_crt_conv_from ("UTF-8");
254 if (conv
== INVALID_CONV
)
255 ret
= g_strdup (def_msg
!= NULL
? def_msg
: "");
260 buf
= g_string_new ("");
262 if (str_convert (conv
, mcerror
->message
, buf
) != ESTR_FAILURE
)
263 ret
= g_string_free (buf
, FALSE
);
266 ret
= g_strdup (def_msg
!= NULL
? def_msg
: "");
267 g_string_free (buf
, TRUE
);
270 str_close_conv (conv
);
276 /* --------------------------------------------------------------------------------------------- */
/* Appends string (size bytes) to buffer, converting it with coder.
 * When coder is str_cnv_not_convert the bytes are appended unchanged and
 * result keeps its initial value ESTR_SUCCESS; otherwise result is whatever
 * str_nconvert () reports. */
279 str_8bit_vfs_convert_to (GIConv coder
, const char *string
, int size
, GString
*buffer
)
281 estr_t result
= ESTR_SUCCESS
;
283 if (coder
== str_cnv_not_convert
)
284 g_string_append_len (buffer
, string
, size
);
286 result
= str_nconvert (coder
, string
, size
, buffer
);
291 /* --------------------------------------------------------------------------------------------- */
/* Copies text into a static buffer of BUF_MEDIUM bytes, replacing every
 * byte rejected by char_isprint () with '.'.
 *
 * The copy loop runs only while remain > 1, so at least one byte of the
 * buffer is left unused after the copied text.  Because result is static,
 * its contents are overwritten by the next call. */
294 str_8bit_term_form (const char *text
)
296 static char result
[BUF_MEDIUM
];
303 remain
= sizeof (result
);
304 length
= strlen (text
);
306 for (; pos
< length
&& remain
> 1; pos
++, actual
++, remain
--)
307 actual
[0] = char_isprint (text
[pos
]) ? text
[pos
] : '.';
313 /* --------------------------------------------------------------------------------------------- */
/* Lays text out in a static BUF_MEDIUM buffer for a field of width columns,
 * aligned according to just_mode.  Non-printable bytes (per
 * char_isprint ()) are written as '.'.
 *
 * - Text fits (length <= width): HIDE_FIT (just_mode) selects the left
 *   padding ident, either (width - length) / 2 or width - length in the
 *   two assignments shown; ident spaces are written, then the text, then
 *   spaces for the remaining width - length - ident columns.
 * - Text is too long and IS_FIT (just_mode) holds: the first width / 2
 *   bytes are copied, pos is advanced by length - width + 1, and the rest
 *   of text is copied.
 * - Text is too long otherwise: HIDE_FIT (just_mode) selects ident,
 *   (length - width) / 2 or length - width, and bytes are copied while
 *   pos < ident + width.
 *
 * Every copy loop stops while remain > 1, and at the end actual is clamped
 * to the last byte of result.  Because result is static, its contents are
 * overwritten by the next call. */
316 str_8bit_fit_to_term (const char *text
, int width
, align_crt_t just_mode
)
318 static char result
[BUF_MEDIUM
];
325 length
= strlen (text
);
327 remain
= sizeof (result
);
/* text fits into the field: pad it */
329 if ((int) length
<= width
)
331 switch (HIDE_FIT (just_mode
))
335 ident
= (width
- length
) / 2;
338 ident
= width
- length
;
/* the left padding must itself fit into what is left of result */
344 if ((int) remain
<= ident
)
346 memset (actual
, ' ', ident
);
350 for (; pos
< length
&& remain
> 1; pos
++, actual
++, remain
--)
351 actual
[0] = char_isprint (text
[pos
]) ? text
[pos
] : '.';
/* columns still free to the right of the text */
353 if (width
- length
- ident
> 0)
355 if (remain
<= width
- length
- ident
)
357 memset (actual
, ' ', width
- length
- ident
);
358 actual
+= width
- length
- ident
;
/* text is too long and may be shortened: keep its head and its tail */
361 else if (IS_FIT (just_mode
))
363 for (; pos
+ 1 <= (gsize
) width
/ 2 && remain
> 1; actual
++, pos
++, remain
--)
364 actual
[0] = char_isprint (text
[pos
]) ? text
[pos
] : '.';
372 pos
+= length
- width
+ 1;
373 for (; pos
< length
&& remain
> 1; pos
++, actual
++, remain
--)
374 actual
[0] = char_isprint (text
[pos
]) ? text
[pos
] : '.';
/* text is too long: copy a window of it selected by ident */
378 switch (HIDE_FIT (just_mode
))
381 ident
= (length
- width
) / 2;
384 ident
= length
- width
;
391 for (; pos
< (gsize
) (ident
+ width
) && remain
> 1; pos
++, actual
++, remain
--)
392 actual
[0] = char_isprint (text
[pos
]) ? text
[pos
] : '.';
/* never let actual point past the last byte of result */
396 if (actual
>= result
+ sizeof (result
))
397 actual
= result
+ sizeof (result
) - 1;
402 /* --------------------------------------------------------------------------------------------- */
/* Builds, in a static BUF_MEDIUM buffer, a form of text trimmed to width
 * columns.  Non-printable bytes (per char_isprint ()) are written as '.'.
 *
 * When width >= length the whole text is copied.  The remaining statements
 * either fill width dots, or write three dots followed by the tail of text
 * starting at offset length - width + 3, so the dots plus the tail occupy
 * width columns.
 * NOTE(review): the condition choosing between the two dot forms is not
 * visible here; confirm before relying on it.
 *
 * Because result is static, its contents are overwritten by the next
 * call. */
405 str_8bit_term_trim (const char *text
, int width
)
407 static char result
[BUF_MEDIUM
];
412 length
= strlen (text
);
414 remain
= sizeof (result
);
420 if (width
>= (int) length
)
422 for (pos
= 0; pos
< length
&& remain
> 1; pos
++, actual
++, remain
--)
423 actual
[0] = char_isprint (text
[pos
]) ? text
[pos
] : '.';
427 memset (actual
, '.', width
);
432 memset (actual
, '.', 3);
436 for (pos
= length
- width
+ 3; pos
< length
&& remain
> 1; pos
++, actual
++, remain
--)
437 actual
[0] = char_isprint (text
[pos
]) ? text
[pos
] : '.';
445 /* --------------------------------------------------------------------------------------------- */
/* Width of at most length bytes of text: strlen (text) capped at length.
 * Passing (size_t) (-1) as length means "no limit" and yields the full
 * strlen (). */
448 str_8bit_term_width2 (const char *text
, size_t length
)
452 text_len
= strlen (text
);
454 return (length
!= (size_t) (-1)) ? MIN (text_len
, length
) : text_len
;
457 /* --------------------------------------------------------------------------------------------- */
/* Width of the whole text: str_8bit_term_width2 () called with the
 * "no limit" value (size_t) (-1). */
460 str_8bit_term_width1 (const char *text
)
462 return str_8bit_term_width2 (text
, (size_t) (-1));
465 /* --------------------------------------------------------------------------------------------- */
468 str_8bit_term_char_width (const char *text
)
474 /* --------------------------------------------------------------------------------------------- */
/* Builds, in a static BUF_MEDIUM buffer, the part of text that starts at
 * byte start and is width columns wide.
 *
 * If start lies inside text, bytes are copied (non-printable ones as '.')
 * until width is used up, text ends, or only one byte of the buffer
 * remains.  The final loop then steps over whatever is left of width,
 * again bounded by remain > 1.
 *
 * Because result is static, its contents are overwritten by the next
 * call. */
477 str_8bit_term_substring (const char *text
, int start
, int width
)
479 static char result
[BUF_MEDIUM
];
485 remain
= sizeof (result
);
486 length
= strlen (text
);
488 if (start
< (int) length
)
492 for (pos
= start
; pos
< length
&& width
> 0 && remain
> 1;
493 pos
++, width
--, actual
++, remain
--)
494 actual
[0] = char_isprint (text
[pos
]) ? text
[pos
] : '.';
497 for (; width
> 0 && remain
> 1; actual
++, remain
--, width
--)
504 /* --------------------------------------------------------------------------------------------- */
/* Builds, in a static MC_MAXPATHLEN buffer, a form of text shortened to
 * width columns.  Non-printable bytes (per char_isprint ()) are written
 * as '.'.
 *
 * When text is longer than width, the first width / 2 bytes are copied,
 * pos is advanced by length - width + 1, and the rest of text is copied;
 * otherwise the whole text is copied.  All loops stop while remain > 1.
 *
 * Because result is static, its contents are overwritten by the next
 * call. */
507 str_8bit_trunc (const char *text
, int width
)
509 static char result
[MC_MAXPATHLEN
];
516 remain
= sizeof (result
);
517 length
= strlen (text
);
519 if ((int) length
> width
)
521 for (; pos
+ 1 <= (gsize
) width
/ 2 && remain
> 1; actual
++, pos
++, remain
--)
522 actual
[0] = char_isprint (text
[pos
]) ? text
[pos
] : '.';
530 pos
+= length
- width
+ 1;
531 for (; pos
< length
&& remain
> 1; pos
++, actual
++, remain
--)
532 actual
[0] = char_isprint (text
[pos
]) ? text
[pos
] : '.';
536 for (; pos
< length
&& remain
> 1; pos
++, actual
++, remain
--)
537 actual
[0] = char_isprint (text
[pos
]) ? text
[pos
] : '.';
545 /* --------------------------------------------------------------------------------------------- */
548 str_8bit_offset_to_pos (const char *text
, size_t length
)
554 /* --------------------------------------------------------------------------------------------- */
557 str_8bit_column_to_pos (const char *text
, size_t pos
)
563 /* --------------------------------------------------------------------------------------------- */
/* Returns needle itself with the const qualifier cast away; no separate
 * needle object is allocated. */
566 str_8bit_create_search_needle (const char *needle
, gboolean case_sen
)
569 return (char *) needle
;
572 /* --------------------------------------------------------------------------------------------- */
575 str_8bit_release_search_needle (char *needle
, gboolean case_sen
)
581 /* --------------------------------------------------------------------------------------------- */
/* Makes a g_strdup () copy of str in rets and lower-cases it in place, one
 * byte at a time, with char_tolower (). */
584 str_8bit_strdown (const char *str
)
591 rets
= g_strdup (str
);
593 for (p
= rets
; *p
!= '\0'; p
++)
594 *p
= char_tolower (*p
);
599 /* --------------------------------------------------------------------------------------------- */
/* Finds the first occurrence of search in text with g_strstr_len ().
 *
 * With case_sen set the original strings are searched directly.  Otherwise
 * both are lower-cased with str_8bit_strdown () first, and a match found in
 * the folded copy is mapped back to the same byte offset in text.  This
 * works because folding is done byte for byte and keeps the length.  The
 * folded search string is released with g_free (). */
602 str_8bit_search_first (const char *text
, const char *search
, gboolean case_sen
)
608 fold_text
= case_sen
? (char *) text
: str_8bit_strdown (text
);
609 fold_search
= case_sen
? (char *) search
: str_8bit_strdown (search
);
611 match
= g_strstr_len (fold_text
, -1, fold_search
);
616 offset
= match
- fold_text
;
617 match
= text
+ offset
;
623 g_free (fold_search
);
629 /* --------------------------------------------------------------------------------------------- */
/* Finds the last occurrence of search in text with g_strrstr_len ().
 *
 * With case_sen set the original strings are searched directly.  Otherwise
 * both are lower-cased with str_8bit_strdown () first, and a match found in
 * the folded copy is mapped back to the same byte offset in text.  This
 * works because folding is done byte for byte and keeps the length.  The
 * folded search string is released with g_free (). */
632 str_8bit_search_last (const char *text
, const char *search
, gboolean case_sen
)
638 fold_text
= case_sen
? (char *) text
: str_8bit_strdown (text
);
639 fold_search
= case_sen
? (char *) search
: str_8bit_strdown (search
);
641 match
= g_strrstr_len (fold_text
, -1, fold_search
);
646 offset
= match
- fold_text
;
647 match
= text
+ offset
;
653 g_free (fold_search
);
659 /* --------------------------------------------------------------------------------------------- */
/* Compares t1 and t2 with strcmp () and returns its result. */
662 str_8bit_compare (const char *t1
, const char *t2
)
664 return strcmp (t1
, t2
);
667 /* --------------------------------------------------------------------------------------------- */
/* Compares only the first MIN (l1, l2) bytes of t1 and t2 with strncmp ().
 * NOTE(review): l1 and l2 are presumably the lengths of t1 and t2; their
 * assignments are not visible here -- confirm. */
670 str_8bit_ncompare (const char *t1
, const char *t2
)
677 return strncmp (t1
, t2
, MIN (l1
, l2
));
680 /* --------------------------------------------------------------------------------------------- */
/* Case-insensitive comparison of s1 and s2.
 *
 * A NULL argument makes g_return_val_if_fail () return 0.  When
 * HAVE_STRCASECMP is defined the work is delegated to strcasecmp ().
 * The other variant walks both strings while neither has ended,
 * lower-casing upper-case bytes into c1 and c2 (bytes are passed to
 * isupper ()/tolower () as guchar), and finally returns the difference of
 * the bytes at which the walk stopped, taken as unsigned values. */
683 str_8bit_casecmp (const char *s1
, const char *s2
)
687 #ifdef HAVE_STRCASECMP
688 g_return_val_if_fail (s1
!= NULL
, 0);
689 g_return_val_if_fail (s2
!= NULL
, 0);
691 return strcasecmp (s1
, s2
);
694 g_return_val_if_fail (s1
!= NULL
, 0);
695 g_return_val_if_fail (s2
!= NULL
, 0);
697 for (; *s1
!= '\0' && *s2
!= '\0'; s1
++, s2
++)
701 /* According to A. Cox, some platforms have islower's that
702 * don't work right on non-uppercase
704 c1
= isupper ((guchar
) * s1
) ? tolower ((guchar
) * s1
) : *s1
;
705 c2
= isupper ((guchar
) * s2
) ? tolower ((guchar
) * s2
) : *s2
;
710 return (((gint
) (guchar
) * s1
) - ((gint
) (guchar
) * s2
));
714 /* --------------------------------------------------------------------------------------------- */
/* Length-limited case-insensitive comparison of s1 and s2.
 *
 * A NULL argument makes g_return_val_if_fail () return 0.  When
 * HAVE_STRNCASECMP is defined the work is delegated to
 * strncasecmp (s1, s2, n).  The other variant walks both strings while
 * neither has ended, lower-casing upper-case bytes into c1 and c2, and
 * finally returns the difference of the bytes at which the walk stopped,
 * taken as unsigned values.
 * NOTE(review): the computation of n is not visible here -- confirm how
 * the limit is derived. */
717 str_8bit_ncasecmp (const char *s1
, const char *s2
)
722 g_return_val_if_fail (s1
!= NULL
, 0);
723 g_return_val_if_fail (s2
!= NULL
, 0);
731 #ifdef HAVE_STRNCASECMP
732 return strncasecmp (s1
, s2
, n
);
735 for (; *s1
!= '\0' && *s2
!= '\0'; s1
++, s2
++)
740 /* According to A. Cox, some platforms have islower's that
741 * don't work right on non-uppercase
743 c1
= isupper ((guchar
) * s1
) ? tolower ((guchar
) * s1
) : *s1
;
744 c2
= isupper ((guchar
) * s2
) ? tolower ((guchar
) * s2
) : *s2
;
752 return (((gint
) (guchar
) * s1
) - ((gint
) (guchar
) * s2
));
757 /* --------------------------------------------------------------------------------------------- */
/* Counts the leading bytes that text and prefix have in common: result
 * advances while neither string has ended and the bytes at that index are
 * equal.  The loop has an empty body; all the work is in its header. */
760 str_8bit_prefix (const char *text
, const char *prefix
)
764 for (result
= 0; text
[result
] != '\0' && prefix
[result
] != '\0'
765 && text
[result
] == prefix
[result
]; result
++);
770 /* --------------------------------------------------------------------------------------------- */
/* Case-insensitive variant of the common-prefix count: result advances
 * while neither string has ended and the bytes at that index are equal
 * after char_toupper ().  The loop has an empty body; all the work is in
 * its header. */
773 str_8bit_caseprefix (const char *text
, const char *prefix
)
777 for (result
= 0; text
[result
] != '\0' && prefix
[result
] != '\0'
778 && char_toupper (text
[result
]) == char_toupper (prefix
[result
]); result
++);
783 /* --------------------------------------------------------------------------------------------- */
786 str_8bit_fix_string (char *text
)
791 /* --------------------------------------------------------------------------------------------- */
/* Produces the comparison key for text.  For case-sensitive use the key is
 * text itself (const cast away, nothing allocated); otherwise it is the
 * lower-cased copy made by str_8bit_strdown (). */
794 str_8bit_create_key (const char *text
, gboolean case_sen
)
796 return case_sen
? (char *) text
: str_8bit_strdown (text
);
799 /* --------------------------------------------------------------------------------------------- */
/* Orders two keys: strcmp () when case_sen is set, strcoll () otherwise. */
802 str_8bit_key_collate (const char *t1
, const char *t2
, gboolean case_sen
)
804 return case_sen
? strcmp (t1
, t2
) : strcoll (t1
, t2
);
807 /* --------------------------------------------------------------------------------------------- */
810 str_8bit_release_key (char *key
, gboolean case_sen
)
816 /* --------------------------------------------------------------------------------------------- */
817 /*** public functions ****************************************************************************/
818 /* --------------------------------------------------------------------------------------------- */
/* Fills result, a struct str_class, with the 8-bit implementation of each
 * string operation.  Several slots deliberately share one implementation:
 * cnext_char_safe and cprev_char_safe use the plain str_8bit_cnext_char /
 * str_8bit_cprev_char, length_noncomb uses str_8bit_length, and
 * create_key_for_filename uses str_8bit_create_key. */
823 struct str_class result
;
825 result
.conv_gerror_message
= str_8bit_conv_gerror_message
;
826 result
.vfs_convert_to
= str_8bit_vfs_convert_to
;
827 result
.insert_replace_char
= str_8bit_insert_replace_char
;
828 result
.is_valid_string
= str_8bit_is_valid_string
;
829 result
.is_valid_char
= str_8bit_is_valid_char
;
830 result
.cnext_char
= str_8bit_cnext_char
;
831 result
.cprev_char
= str_8bit_cprev_char
;
832 result
.cnext_char_safe
= str_8bit_cnext_char
;
833 result
.cprev_char_safe
= str_8bit_cprev_char
;
834 result
.cnext_noncomb_char
= str_8bit_cnext_noncomb_char
;
835 result
.cprev_noncomb_char
= str_8bit_cprev_noncomb_char
;
836 result
.char_isspace
= str_8bit_isspace
;
837 result
.char_ispunct
= str_8bit_ispunct
;
838 result
.char_isalnum
= str_8bit_isalnum
;
839 result
.char_isdigit
= str_8bit_isdigit
;
840 result
.char_isprint
= str_8bit_isprint
;
841 result
.char_iscombiningmark
= str_8bit_iscombiningmark
;
842 result
.char_toupper
= str_8bit_toupper
;
843 result
.char_tolower
= str_8bit_tolower
;
844 result
.length
= str_8bit_length
;
845 result
.length2
= str_8bit_length2
;
846 result
.length_noncomb
= str_8bit_length
;
847 result
.fix_string
= str_8bit_fix_string
;
848 result
.term_form
= str_8bit_term_form
;
849 result
.fit_to_term
= str_8bit_fit_to_term
;
850 result
.term_trim
= str_8bit_term_trim
;
851 result
.term_width2
= str_8bit_term_width2
;
852 result
.term_width1
= str_8bit_term_width1
;
853 result
.term_char_width
= str_8bit_term_char_width
;
854 result
.term_substring
= str_8bit_term_substring
;
855 result
.trunc
= str_8bit_trunc
;
856 result
.offset_to_pos
= str_8bit_offset_to_pos
;
857 result
.column_to_pos
= str_8bit_column_to_pos
;
858 result
.create_search_needle
= str_8bit_create_search_needle
;
859 result
.release_search_needle
= str_8bit_release_search_needle
;
860 result
.search_first
= str_8bit_search_first
;
861 result
.search_last
= str_8bit_search_last
;
862 result
.compare
= str_8bit_compare
;
863 result
.ncompare
= str_8bit_ncompare
;
864 result
.casecmp
= str_8bit_casecmp
;
865 result
.ncasecmp
= str_8bit_ncasecmp
;
866 result
.prefix
= str_8bit_prefix
;
867 result
.caseprefix
= str_8bit_caseprefix
;
868 result
.create_key
= str_8bit_create_key
;
869 result
.create_key_for_filename
= str_8bit_create_key
;
870 result
.key_collate
= str_8bit_key_collate
;
871 result
.release_key
= str_8bit_release_key
;
876 /* --------------------------------------------------------------------------------------------- */