2004-04-08 09:59:02 +00:00
|
|
|
.\" Copyright (c) 2002-2004 Tim J. Robbins
|
2002-08-18 06:30:10 +00:00
|
|
|
.\" All rights reserved.
|
|
|
|
.\"
|
|
|
|
.\" Redistribution and use in source and binary forms, with or without
|
|
|
|
.\" modification, are permitted provided that the following conditions
|
|
|
|
.\" are met:
|
|
|
|
.\" 1. Redistributions of source code must retain the above copyright
|
|
|
|
.\" notice, this list of conditions and the following disclaimer.
|
|
|
|
.\" 2. Redistributions in binary form must reproduce the above copyright
|
|
|
|
.\" notice, this list of conditions and the following disclaimer in the
|
|
|
|
.\" documentation and/or other materials provided with the distribution.
|
|
|
|
.\"
|
|
|
|
.\" THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
|
|
|
|
.\" ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
.\" IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
.\" ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
|
|
|
|
.\" FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
|
|
.\" DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
|
|
|
|
.\" OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
|
|
|
.\" HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
|
|
|
.\" LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
|
|
|
|
.\" OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
|
|
|
.\" SUCH DAMAGE.
|
|
|
|
.\"
|
|
|
|
.\" $FreeBSD$
|
2002-11-29 17:35:09 +00:00
|
|
|
.\"
|
2004-04-08 09:59:02 +00:00
|
|
|
.Dd April 7, 2004
|
2002-08-18 06:30:10 +00:00
|
|
|
.Dt MBRLEN 3
|
|
|
|
.Os
|
|
|
|
.Sh NAME
|
|
|
|
.Nm mbrlen
|
|
|
|
.Nd "get number of bytes in a character (restartable)"
|
|
|
|
.Sh LIBRARY
|
|
|
|
.Lb libc
|
|
|
|
.Sh SYNOPSIS
|
|
|
|
.In wchar.h
|
|
|
|
.Ft size_t
|
2002-09-06 11:24:06 +00:00
|
|
|
.Fn mbrlen "const char * restrict s" "size_t n" "mbstate_t * restrict ps"
|
2002-08-18 06:30:10 +00:00
|
|
|
.Sh DESCRIPTION
|
|
|
|
The
|
|
|
|
.Fn mbrlen
|
2004-04-08 09:59:02 +00:00
|
|
|
function inspects at most
|
2002-11-09 10:21:01 +00:00
|
|
|
.Fa n
|
2004-04-08 09:59:02 +00:00
|
|
|
bytes pointed to by
|
|
|
|
.Fa s
|
|
|
|
to determine the number of bytes needed to complete the next
|
|
|
|
multibyte character.
|
2002-11-09 10:21:01 +00:00
|
|
|
.Pp
|
|
|
|
The
|
2002-11-29 17:35:09 +00:00
|
|
|
.Vt mbstate_t
|
2002-11-09 10:21:01 +00:00
|
|
|
argument,
|
|
|
|
.Fa ps ,
|
|
|
|
is used to keep track of the shift state.
|
|
|
|
If it is
|
|
|
|
.Dv NULL ,
|
|
|
|
.Fn mbrlen
|
|
|
|
uses an internal, static
|
2002-11-29 17:35:09 +00:00
|
|
|
.Vt mbstate_t
|
2004-04-08 09:59:02 +00:00
|
|
|
object, which is initialized to the initial conversion state
|
|
|
|
at program startup.
|
2002-08-18 06:30:10 +00:00
|
|
|
.Pp
|
|
|
|
It is equivalent to:
|
|
|
|
.Pp
|
|
|
|
.Dl "mbrtowc(NULL, s, n, ps);"
|
|
|
|
.Pp
|
|
|
|
except that when
|
|
|
|
.Fa ps
|
2002-11-29 17:35:09 +00:00
|
|
|
is a
|
|
|
|
.Dv NULL
|
|
|
|
pointer,
|
2002-08-18 06:30:10 +00:00
|
|
|
.Fn mbrlen
|
|
|
|
uses its own static, internal
|
2002-11-29 17:35:09 +00:00
|
|
|
.Vt mbstate_t
|
|
|
|
object to keep track of the shift state.
|
2002-08-18 06:30:10 +00:00
|
|
|
.Sh RETURN VALUES
|
|
|
|
The
|
|
|
|
.Fn mbrlen
|
|
|
|
function returns:
|
|
|
|
.Bl -tag -width indent
|
|
|
|
.It 0
|
2004-04-08 09:59:02 +00:00
|
|
|
The next
|
2002-08-18 06:30:10 +00:00
|
|
|
.Fa n
|
2004-04-08 09:59:02 +00:00
|
|
|
or fewer bytes
|
2002-11-29 17:35:09 +00:00
|
|
|
represent the null wide character
|
|
|
|
.Pq Li "L'\e0'" .
|
2002-08-18 06:30:10 +00:00
|
|
|
.It >0
|
2004-04-08 09:59:02 +00:00
|
|
|
The next
|
2002-08-18 06:30:10 +00:00
|
|
|
.Fa n
|
2004-04-08 09:59:02 +00:00
|
|
|
or fewer bytes
|
2002-08-18 06:30:10 +00:00
|
|
|
represent a valid character;
|
2004-04-08 09:59:02 +00:00
|
|
|
.Fn mbrlen
|
|
|
|
returns the number of bytes used to complete the multibyte character.
|
2002-11-29 17:35:09 +00:00
|
|
|
.It Po Vt size_t Pc Ns \-2
|
2004-04-08 09:59:02 +00:00
|
|
|
The next
|
2002-08-18 06:30:10 +00:00
|
|
|
.Fa n
|
2004-04-08 09:59:02 +00:00
|
|
|
bytes contribute to, but do not complete, a valid multibyte character sequence,
|
|
|
|
and all
|
|
|
|
.Fa n
|
|
|
|
bytes have been processed.
|
2002-11-29 17:35:09 +00:00
|
|
|
.It Po Vt size_t Pc Ns \-1
|
2004-04-08 09:59:02 +00:00
|
|
|
An encoding error has occurred.
|
|
|
|
The next
|
2004-06-30 19:32:41 +00:00
|
|
|
.Fa n
|
2004-04-08 09:59:02 +00:00
|
|
|
or fewer bytes do not contribute to a valid multibyte character.
|
2002-08-18 06:30:10 +00:00
|
|
|
.El
|
2002-10-03 14:07:26 +00:00
|
|
|
.Sh EXAMPLES
|
2004-04-08 09:59:02 +00:00
|
|
|
A function that calculates the number of characters in a multibyte
|
2002-10-03 14:07:26 +00:00
|
|
|
character string:
|
|
|
|
.Bd -literal -offset indent
|
|
|
|
size_t
|
|
|
|
nchars(const char *s)
|
|
|
|
{
|
|
|
|
size_t charlen, chars;
|
|
|
|
mbstate_t mbs;
|
|
|
|
|
|
|
|
chars = 0;
|
|
|
|
memset(&mbs, 0, sizeof(mbs));
|
|
|
|
while ((charlen = mbrlen(s, MB_CUR_MAX, &mbs)) != 0 &&
|
|
|
|
charlen != (size_t)-1 && charlen != (size_t)-2) {
|
|
|
|
s += charlen;
|
|
|
|
chars++;
|
|
|
|
}
|
|
|
|
|
|
|
|
return (chars);
|
|
|
|
}
|
|
|
|
.Ed
|
2002-08-18 06:30:10 +00:00
|
|
|
.Sh ERRORS
|
|
|
|
The
|
|
|
|
.Fn mbrlen
|
|
|
|
function will fail if:
|
|
|
|
.Bl -tag -width Er
|
|
|
|
.It Bq Er EILSEQ
|
|
|
|
An invalid multibyte sequence was detected.
|
2004-04-08 09:59:02 +00:00
|
|
|
.It Bq Er EINVAL
|
|
|
|
The conversion state is invalid.
|
2002-08-18 06:30:10 +00:00
|
|
|
.El
|
|
|
|
.Sh SEE ALSO
|
|
|
|
.Xr mblen 3 ,
|
2004-04-08 09:59:02 +00:00
|
|
|
.Xr mbrtowc 3 ,
|
|
|
|
.Xr multibyte 3
|
2002-08-18 06:30:10 +00:00
|
|
|
.Sh STANDARDS
|
|
|
|
The
|
|
|
|
.Fn mbrlen
|
|
|
|
function conforms to
|
|
|
|
.St -isoC-99 .
|