2002-08-18 06:30:10 +00:00
|
|
|
.\" Copyright (c) 2002 Tim J. Robbins
|
|
|
|
.\" All rights reserved.
|
|
|
|
.\"
|
|
|
|
.\" Redistribution and use in source and binary forms, with or without
|
|
|
|
.\" modification, are permitted provided that the following conditions
|
|
|
|
.\" are met:
|
|
|
|
.\" 1. Redistributions of source code must retain the above copyright
|
|
|
|
.\" notice, this list of conditions and the following disclaimer.
|
|
|
|
.\" 2. Redistributions in binary form must reproduce the above copyright
|
|
|
|
.\" notice, this list of conditions and the following disclaimer in the
|
|
|
|
.\" documentation and/or other materials provided with the distribution.
|
|
|
|
.\"
|
|
|
|
.\" THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
|
|
|
|
.\" ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
.\" IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
.\" ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
|
|
|
|
.\" FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
|
|
.\" DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
|
|
|
|
.\" OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
|
|
|
.\" HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
|
|
|
.\" LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
|
|
|
|
.\" OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
|
|
|
.\" SUCH DAMAGE.
|
|
|
|
.\"
|
|
|
|
.\" $FreeBSD$
|
2002-11-29 17:35:09 +00:00
|
|
|
.\"
|
2002-11-09 10:21:01 +00:00
|
|
|
.Dd November 11, 2002
|
2002-08-18 06:30:10 +00:00
|
|
|
.Dt MBRLEN 3
|
|
|
|
.Os
|
|
|
|
.Sh NAME
|
|
|
|
.Nm mbrlen
|
|
|
|
.Nd "get number of bytes in a character (restartable)"
|
|
|
|
.Sh LIBRARY
|
|
|
|
.Lb libc
|
|
|
|
.Sh SYNOPSIS
|
|
|
|
.In wchar.h
|
|
|
|
.Ft size_t
|
2002-09-06 11:24:06 +00:00
|
|
|
.Fn mbrlen "const char * restrict s" "size_t n" "mbstate_t * restrict ps"
|
2002-08-18 06:30:10 +00:00
|
|
|
.Sh DESCRIPTION
|
|
|
|
The
|
|
|
|
.Fn mbrlen
|
2002-11-29 17:35:09 +00:00
|
|
|
function determines the number of bytes constituting the
|
2002-11-09 09:47:06 +00:00
|
|
|
multibyte character sequence pointed to by
|
2002-11-09 10:21:01 +00:00
|
|
|
.Fa s ,
|
|
|
|
examining at most
|
|
|
|
.Fa n
|
|
|
|
bytes.
|
|
|
|
.Pp
|
|
|
|
The
|
2002-11-29 17:35:09 +00:00
|
|
|
.Vt mbstate_t
|
2002-11-09 10:21:01 +00:00
|
|
|
argument,
|
|
|
|
.Fa ps ,
|
|
|
|
is used to keep track of the shift state.
|
|
|
|
If it is
|
|
|
|
.Dv NULL ,
|
|
|
|
.Fn mbrlen
|
|
|
|
uses an internal, static
|
2002-11-29 17:35:09 +00:00
|
|
|
.Vt mbstate_t
|
2002-11-09 10:21:01 +00:00
|
|
|
object.
|
2002-08-18 06:30:10 +00:00
|
|
|
.Pp
|
|
|
|
It is equivalent to:
|
|
|
|
.Pp
|
|
|
|
.Dl "mbrtowc(NULL, s, n, ps);"
|
|
|
|
.Pp
|
|
|
|
except that when
|
|
|
|
.Fa ps
|
2002-11-29 17:35:09 +00:00
|
|
|
is a
|
|
|
|
.Dv NULL
|
|
|
|
pointer,
|
2002-08-18 06:30:10 +00:00
|
|
|
.Fn mbrlen
|
|
|
|
uses its own static, internal
|
2002-11-29 17:35:09 +00:00
|
|
|
.Vt mbstate_t
|
|
|
|
object to keep track of the shift state.
|
2002-08-18 06:30:10 +00:00
|
|
|
.Sh RETURN VALUES
|
|
|
|
The
|
|
|
|
.Fn mbrlen
|
|
|
|
function returns:
|
|
|
|
.Bl -tag -width indent
|
|
|
|
.It 0
|
|
|
|
The first
|
|
|
|
.Fa n
|
|
|
|
or fewer bytes of
|
|
|
|
.Fa s
|
2002-11-29 17:35:09 +00:00
|
|
|
represent the null wide character
|
|
|
|
.Pq Li "L'\e0'" .
|
2002-08-18 06:30:10 +00:00
|
|
|
.It >0
|
|
|
|
The first
|
|
|
|
.Fa n
|
|
|
|
or fewer bytes of
|
|
|
|
.Fa s
|
|
|
|
represent a valid character,
|
|
|
|
.Fn mbrlen
|
|
|
|
returns the length (in bytes) of the multibyte sequence.
|
2002-11-29 17:35:09 +00:00
|
|
|
.It Po Vt size_t Pc Ns \-2
|
2002-08-18 06:30:10 +00:00
|
|
|
The first
|
|
|
|
.Fa n
|
|
|
|
bytes of
|
|
|
|
.Fa s
|
|
|
|
are an incomplete multibyte sequence.
|
2002-11-29 17:35:09 +00:00
|
|
|
.It Po Vt size_t Pc Ns \-1
|
2002-08-18 06:30:10 +00:00
|
|
|
The byte sequence pointed to by
|
|
|
|
.Fa s
|
|
|
|
is an invalid multibyte sequence.
|
|
|
|
.El
|
2002-10-03 14:07:26 +00:00
|
|
|
.Sh EXAMPLES
|
|
|
|
A function which calculates the number of characters in a multibyte
|
|
|
|
character string:
|
|
|
|
.Bd -literal -offset indent
|
|
|
|
size_t
|
|
|
|
nchars(const char *s)
|
|
|
|
{
|
|
|
|
size_t charlen, chars;
|
|
|
|
mbstate_t mbs;
|
|
|
|
|
|
|
|
chars = 0;
|
|
|
|
memset(&mbs, 0, sizeof(mbs));
|
|
|
|
while ((charlen = mbrlen(s, MB_CUR_MAX, &mbs)) != 0 &&
|
|
|
|
charlen != (size_t)-1 && charlen != (size_t)-2) {
|
|
|
|
s += charlen;
|
|
|
|
chars++;
|
|
|
|
}
|
|
|
|
|
|
|
|
return (chars);
|
|
|
|
}
|
|
|
|
.Ed
|
2002-08-18 06:30:10 +00:00
|
|
|
.Sh ERRORS
|
|
|
|
The
|
|
|
|
.Fn mbrlen
|
|
|
|
function will fail if:
|
|
|
|
.Bl -tag -width Er
|
|
|
|
.\".It Bq Er EINVAL
|
|
|
|
.\"Invalid argument.
|
|
|
|
.It Bq Er EILSEQ
|
|
|
|
An invalid multibyte sequence was detected.
|
|
|
|
.El
|
|
|
|
.Sh SEE ALSO
|
|
|
|
.Xr mblen 3 ,
|
|
|
|
.Xr mbrtowc 3
|
|
|
|
.Sh STANDARDS
|
|
|
|
The
|
|
|
|
.Fn mbrlen
|
|
|
|
function conforms to
|
|
|
|
.St -isoC-99 .
|
|
|
|
.Sh BUGS
|
|
|
|
The current implementation does not support shift states.
|