hush/include/unicode.h
Denys Vlasenko 9f93d62192 libbb: better unicode width support. Hopefully fixes bug 839.
Also opens up a possibility to make other unicode stuff smaller
and more correct later. but:

function                                             old     new   delta
static.combining                                       -     516    +516
bb_wcwidth                                             -     328    +328
unicode_cut_nchars                                     -     141    +141
mbstowc_internal                                       -      93     +93
in_table                                               -      78     +78
cal_main                                             899     961     +62
static.combining0x10000                                -      40     +40
unicode_strlen                                         -      31     +31
bb_mbstrlen                                           31       -     -31
bb_mbstowcs                                          173     102     -71
------------------------------------------------------------------------------
(add/remove: 7/1 grow/shrink: 1/1 up/down: 1289/-102)        Total: 1187 bytes

Uses code of Markus Kuhn, which is in public domain:
http://www.cl.cam.ac.uk/~mgk25/ucs/wcwidth.c
"Permission to use, copy, modify, and distribute this software
 for any purpose and without fee is hereby granted. The author
 disclaims all warranties with regard to this software."

Signed-off-by: Denys Vlasenko <vda.linux@googlemail.com>
2010-01-24 07:44:03 +01:00

78 lines
1.8 KiB
C

/* vi: set sw=4 ts=4: */
/*
* Licensed under the GPL version 2, see the file LICENSE in this tarball.
*/
#ifndef UNICODE_H
#define UNICODE_H 1
enum {
UNICODE_UNKNOWN = 0,
UNICODE_OFF = 1,
UNICODE_ON = 2,
};
#if !ENABLE_FEATURE_ASSUME_UNICODE
# define unicode_strlen(string) strlen(string)
# define unicode_scrlen(string) TODO
# define unicode_status UNICODE_OFF
# define init_unicode() ((void)0)
#else
size_t FAST_FUNC unicode_strlen(const char *string);
char* FAST_FUNC unicode_cut_nchars(unsigned width, const char *src);
unsigned FAST_FUNC unicode_padding_to_width(unsigned width, const char *src);
# if ENABLE_LOCALE_SUPPORT
# include <wchar.h>
# include <wctype.h>
extern uint8_t unicode_status;
void init_unicode(void) FAST_FUNC;
# else
/* Homegrown Unicode support. It knows only C and Unicode locales. */
# if !ENABLE_FEATURE_CHECK_UNICODE_IN_ENV
# define unicode_status UNICODE_ON
# define init_unicode() ((void)0)
# else
extern uint8_t unicode_status;
void init_unicode(void) FAST_FUNC;
# endif
# undef MB_CUR_MAX
# define MB_CUR_MAX 6
/* Prevent name collisions */
# define wint_t bb_wint_t
# define mbstate_t bb_mbstate_t
# define mbstowcs bb_mbstowcs
# define wcstombs bb_wcstombs
# define wcrtomb bb_wcrtomb
# define iswspace bb_iswspace
# define iswalnum bb_iswalnum
# define iswpunct bb_iswpunct
# define wcwidth bb_wcwidth
typedef int32_t wint_t;
typedef struct {
char bogus;
} mbstate_t;
size_t mbstowcs(wchar_t *dest, const char *src, size_t n) FAST_FUNC;
size_t wcstombs(char *dest, const wchar_t *src, size_t n) FAST_FUNC;
size_t wcrtomb(char *s, wchar_t wc, mbstate_t *ps) FAST_FUNC;
int iswspace(wint_t wc) FAST_FUNC;
int iswalnum(wint_t wc) FAST_FUNC;
int iswpunct(wint_t wc) FAST_FUNC;
# endif /* !LOCALE_SUPPORT */
#endif /* FEATURE_ASSUME_UNICODE */
#endif