1994-05-27 05:00:24 +00:00
|
|
|
.\" Copyright (c) 1989, 1991, 1993
|
|
|
|
.\" The Regents of the University of California. All rights reserved.
|
|
|
|
.\"
|
|
|
|
.\" Redistribution and use in source and binary forms, with or without
|
|
|
|
.\" modification, are permitted provided that the following conditions
|
|
|
|
.\" are met:
|
|
|
|
.\" 1. Redistributions of source code must retain the above copyright
|
|
|
|
.\" notice, this list of conditions and the following disclaimer.
|
|
|
|
.\" 2. Redistributions in binary form must reproduce the above copyright
|
|
|
|
.\" notice, this list of conditions and the following disclaimer in the
|
|
|
|
.\" documentation and/or other materials provided with the distribution.
|
|
|
|
.\" 3. All advertising materials mentioning features or use of this software
|
|
|
|
.\" must display the following acknowledgement:
|
|
|
|
.\" This product includes software developed by the University of
|
|
|
|
.\" California, Berkeley and its contributors.
|
|
|
|
.\" 4. Neither the name of the University nor the names of its contributors
|
|
|
|
.\" may be used to endorse or promote products derived from this software
|
|
|
|
.\" without specific prior written permission.
|
|
|
|
.\"
|
|
|
|
.\" THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
|
|
|
|
.\" ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
.\" IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
.\" ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
|
|
|
|
.\" FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
|
|
.\" DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
|
|
|
|
.\" OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
|
|
|
.\" HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
|
|
|
.\" LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
|
|
|
|
.\" OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
|
|
|
.\" SUCH DAMAGE.
|
|
|
|
.\"
|
|
|
|
.\" @(#)unvis.3 8.2 (Berkeley) 12/11/93
|
1999-08-28 00:22:10 +00:00
|
|
|
.\" $FreeBSD$
|
1994-05-27 05:00:24 +00:00
|
|
|
.\"
|
|
|
|
.Dd December 11, 1993
|
|
|
|
.Dt UNVIS 3
|
|
|
|
.Os
|
|
|
|
.Sh NAME
|
|
|
|
.Nm unvis ,
|
|
|
|
.Nm strunvis ,
.Nm strunvisx
|
|
|
|
.Nd decode a visual representation of characters
|
2000-04-21 09:42:15 +00:00
|
|
|
.Sh LIBRARY
|
|
|
|
.Lb libc
|
1994-05-27 05:00:24 +00:00
|
|
|
.Sh SYNOPSIS
|
2001-10-01 16:09:29 +00:00
|
|
|
.In vis.h
|
2000-07-03 08:31:02 +00:00
|
|
|
.Ft int
|
1997-04-13 13:16:20 +00:00
|
|
|
.Fn unvis "char *cp" "int c" "int *astate" "int flag"
|
2000-07-03 08:31:02 +00:00
|
|
|
.Ft int
|
1997-04-13 13:16:20 +00:00
|
|
|
.Fn strunvis "char *dst" "const char *src"
|
2000-07-03 08:31:02 +00:00
|
|
|
.Ft int
|
2000-07-02 21:31:26 +00:00
|
|
|
.Fn strunvisx "char *dst" "const char *src" "int flag"
|
1994-05-27 05:00:24 +00:00
|
|
|
.Sh DESCRIPTION
|
|
|
|
The
|
2000-07-02 21:31:26 +00:00
|
|
|
.Fn unvis ,
|
1994-05-27 05:00:24 +00:00
|
|
|
.Fn strunvis
|
2000-07-02 21:31:26 +00:00
|
|
|
and
|
|
|
|
.Fn strunvisx
|
1994-05-27 05:00:24 +00:00
|
|
|
functions
|
|
|
|
are used to decode a visual representation of characters, as produced
|
|
|
|
by the
|
|
|
|
.Xr vis 3
|
|
|
|
function, back into
|
2004-07-02 23:52:20 +00:00
|
|
|
the original form.
|
|
|
|
The
.Fn unvis
function is called with successive characters in
|
2002-12-18 13:33:04 +00:00
|
|
|
.Fa c
|
1994-05-27 05:00:24 +00:00
|
|
|
until a valid
|
|
|
|
sequence is recognized, at which time the decoded character is
|
|
|
|
available at the character pointed to by
|
2002-12-18 13:33:04 +00:00
|
|
|
.Fa cp .
|
1994-05-27 05:00:24 +00:00
|
|
|
The
.Fn strunvis
function decodes the
|
|
|
|
characters pointed to by
|
2002-12-18 13:33:04 +00:00
|
|
|
.Fa src
|
1994-05-27 05:00:24 +00:00
|
|
|
into the buffer pointed to by
|
2002-12-18 13:33:04 +00:00
|
|
|
.Fa dst .
|
1994-05-27 05:00:24 +00:00
|
|
|
.Pp
|
|
|
|
The
|
|
|
|
.Fn strunvis
|
|
|
|
function
|
|
|
|
simply copies
|
2002-12-18 13:33:04 +00:00
|
|
|
.Fa src
|
1994-05-27 05:00:24 +00:00
|
|
|
to
|
2002-12-18 13:33:04 +00:00
|
|
|
.Fa dst ,
|
1994-05-27 05:00:24 +00:00
|
|
|
decoding any escape sequences along the way,
|
|
|
|
and returns the number of characters placed into
|
2002-12-18 13:33:04 +00:00
|
|
|
.Fa dst ,
|
1994-05-27 05:00:24 +00:00
|
|
|
or \-1 if an
|
2004-07-02 23:52:20 +00:00
|
|
|
invalid escape sequence was detected.
|
|
|
|
The size of
|
2002-12-18 13:33:04 +00:00
|
|
|
.Fa dst
|
1994-05-27 05:00:24 +00:00
|
|
|
should be
|
|
|
|
equal to the size of
|
2002-12-18 13:33:04 +00:00
|
|
|
.Fa src
|
1994-05-27 05:00:24 +00:00
|
|
|
(that is, no expansion takes place during
|
|
|
|
decoding).
|
|
|
|
.Pp
|
|
|
|
The
|
2000-07-02 21:31:26 +00:00
|
|
|
.Fn strunvisx
|
|
|
|
function does the same as the
|
|
|
|
.Fn strunvis
|
2000-07-03 08:28:30 +00:00
|
|
|
function,
|
|
|
|
but it allows you to add a flag that specifies the style the string
|
2002-12-18 13:33:04 +00:00
|
|
|
.Fa src
|
2000-07-02 21:31:26 +00:00
|
|
|
is encoded with.
|
|
|
|
Currently, the only supported flag is
|
|
|
|
.Dv VIS_HTTPSTYLE .
|
|
|
|
.Pp
|
|
|
|
The
|
1994-05-27 05:00:24 +00:00
|
|
|
.Fn unvis
|
|
|
|
function
|
|
|
|
implements a state machine that can be used to decode an arbitrary
|
2004-07-02 23:52:20 +00:00
|
|
|
stream of bytes.
|
|
|
|
All state associated with the bytes being decoded
|
1994-05-27 05:00:24 +00:00
|
|
|
is stored outside the
|
|
|
|
.Fn unvis
|
|
|
|
function (that is, a pointer to the state is passed in), so
|
2004-07-02 23:52:20 +00:00
|
|
|
calls decoding different streams can be freely intermixed.
|
|
|
|
To
|
1994-05-27 05:00:24 +00:00
|
|
|
start decoding a stream of bytes, first initialize an integer
|
2004-07-02 23:52:20 +00:00
|
|
|
to zero.
|
|
|
|
Call
|
1994-05-27 05:00:24 +00:00
|
|
|
.Fn unvis
|
|
|
|
with each successive byte, along with a pointer
|
|
|
|
to this integer, and a pointer to a destination character.
|
|
|
|
The
|
1996-03-27 20:49:07 +00:00
|
|
|
.Fn unvis
|
1994-05-27 05:00:24 +00:00
|
|
|
function
|
2004-07-02 23:52:20 +00:00
|
|
|
has several return codes that must be handled properly.
|
|
|
|
They are:
|
1994-05-27 05:00:24 +00:00
|
|
|
.Bl -tag -width UNVIS_VALIDPUSH
|
|
|
|
.It Li \&0 (zero)
|
|
|
|
Another character is necessary; nothing has been recognized yet.
|
2004-07-03 22:30:10 +00:00
|
|
|
.It Dv UNVIS_VALID
|
1994-05-27 05:00:24 +00:00
|
|
|
A valid character has been recognized and is available at the location
|
|
|
|
pointed to by
.Fa cp .
|
2004-07-03 22:30:10 +00:00
|
|
|
.It Dv UNVIS_VALIDPUSH
|
1994-05-27 05:00:24 +00:00
|
|
|
A valid character has been recognized and is available at the location
|
|
|
|
pointed to by
.Fa cp ;
however, the character currently passed in should
|
|
|
|
be passed in again.
|
2004-07-03 22:30:10 +00:00
|
|
|
.It Dv UNVIS_NOCHAR
|
2004-07-02 23:52:20 +00:00
|
|
|
A valid sequence was detected, but no character was produced.
|
|
|
|
This
|
1994-05-27 05:00:24 +00:00
|
|
|
return code is necessary to indicate a logical break between characters.
|
2004-07-03 22:30:10 +00:00
|
|
|
.It Dv UNVIS_SYNBAD
|
1994-05-27 05:00:24 +00:00
|
|
|
An invalid escape sequence was detected, or the decoder is in an
|
2004-07-02 23:52:20 +00:00
|
|
|
unknown state.
|
|
|
|
The decoder is placed into the starting state.
|
1994-05-27 05:00:24 +00:00
|
|
|
.El
|
|
|
|
.Pp
|
|
|
|
When all bytes in the stream have been processed, call
|
|
|
|
.Fn unvis
|
2000-07-02 21:31:26 +00:00
|
|
|
one more time with
|
2002-12-18 13:33:04 +00:00
|
|
|
.Fa flag
|
2000-07-02 21:31:26 +00:00
|
|
|
set to
|
1994-05-27 05:00:24 +00:00
|
|
|
.Dv UNVIS_END
|
|
|
|
to extract any remaining character (the character passed in is ignored).
|
|
|
|
.Pp
|
2000-07-02 21:31:26 +00:00
|
|
|
The
|
2002-12-18 13:33:04 +00:00
|
|
|
.Fa flag
|
2000-07-02 21:31:26 +00:00
|
|
|
argument is also used to specify the encoding style of the source.
|
|
|
|
If set to
|
|
|
|
.Dv VIS_HTTPSTYLE ,
|
|
|
|
.Fn unvis
|
|
|
|
will decode URI strings as specified in RFC 1808.
|
|
|
|
.Pp
|
1994-05-27 05:00:24 +00:00
|
|
|
The following code fragment illustrates a proper use of
|
|
|
|
.Fn unvis .
|
|
|
|
.Bd -literal -offset indent
|
|
|
|
int state = 0;
|
|
|
|
char out;
int ch;
|
|
|
|
|
|
|
|
while ((ch = getchar()) != EOF) {
|
|
|
|
again:
|
|
|
|
switch(unvis(&out, ch, &state, 0)) {
|
|
|
|
case 0:
|
|
|
|
case UNVIS_NOCHAR:
|
|
|
|
break;
|
|
|
|
case UNVIS_VALID:
|
|
|
|
(void) putchar(out);
|
|
|
|
break;
|
|
|
|
case UNVIS_VALIDPUSH:
|
|
|
|
(void) putchar(out);
|
|
|
|
goto again;
|
|
|
|
case UNVIS_SYNBAD:
|
2000-12-29 14:08:20 +00:00
|
|
|
(void)fprintf(stderr, "bad sequence!\en");
|
1994-05-27 05:00:24 +00:00
|
|
|
exit(1);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (unvis(&out, (char)0, &state, UNVIS_END) == UNVIS_VALID)
|
|
|
|
(void) putchar(out);
|
|
|
|
.Ed
|
|
|
|
.Sh SEE ALSO
|
2000-07-03 08:26:50 +00:00
|
|
|
.Xr vis 1 ,
|
|
|
|
.Xr vis 3
|
|
|
|
.Rs
|
|
|
|
.%A R. Fielding
|
|
|
|
.%T Relative Uniform Resource Locators
|
|
|
|
.%O RFC1808
|
|
|
|
.Re
|
1994-05-27 05:00:24 +00:00
|
|
|
.Sh HISTORY
|
|
|
|
The
|
2000-11-20 14:11:46 +00:00
|
|
|
.Fn unvis
|
1994-05-27 05:00:24 +00:00
|
|
|
function
|
1996-08-22 23:31:07 +00:00
|
|
|
first appeared in
|
|
|
|
.Bx 4.4 .
|