5f2a1d6536
This is the gsoc-2011 project to clean up and backport multibyte support from other nvi forks in a form we can use. USE_WIDECHAR is on unless building for the rescue crunchgen. This should allow editing in the native locale encoding. USE_ICONV depends on make.conf having 'WITH_ICONV=YES' for now. This adds the ability to do things like edit a KOI8-R file while having $LANG set to (say) en_US.UTF-8. iconv is used to transcode the characters for display. Other points: * It uses gencat and catopen/etc instead of homegrown msg catalog stuff. * A lot of stuff has been trimmed out, eg: the perl and tcl bindings which we could never use in base anyway. * It uses ncursesw when in widechar mode. This could be interesting. GSoC info: http://www.google-melange.com/gsoc/proposal/review/google/gsoc2011/zy/1 Repo at: https://github.com/lichray/nvi2 Obtained from: Zhihao Yuan <lichray@gmail.com>
223 lines
4.6 KiB
C
223 lines
4.6 KiB
C
/*-
|
|
* Copyright (c) 1992, 1993, 1994
|
|
* The Regents of the University of California. All rights reserved.
|
|
* Copyright (c) 1992, 1993, 1994, 1995, 1996
|
|
* Keith Bostic. All rights reserved.
|
|
*
|
|
* See the LICENSE file for redistribution information.
|
|
*/
|
|
|
|
#include "config.h"
|
|
|
|
#ifndef lint
|
|
static const char sccsid[] = "$Id: getc.c,v 10.13 2011/12/27 00:49:31 zy Exp $";
|
|
#endif /* not lint */
|
|
|
|
#include <sys/types.h>
|
|
#include <sys/queue.h>
|
|
#include <sys/time.h>
|
|
|
|
#include <bitstring.h>
|
|
#include <ctype.h>
|
|
#include <limits.h>
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
|
|
#include "../common/common.h"
|
|
#include "vi.h"
|
|
|
|
/*
|
|
* Character stream routines --
|
|
* These routines return the file a character at a time. There are two
|
|
* special cases. First, the end of a line, end of a file, start of a
|
|
* file and empty lines are returned as special cases, and no character
|
|
* is returned. Second, empty lines include lines that have only white
|
|
* space in them, because the vi search functions don't care about white
|
|
* space, and this makes it easier for them to be consistent.
|
|
*/
|
|
|
|
/*
|
|
* cs_init --
|
|
* Initialize character stream routines.
|
|
*
|
|
* PUBLIC: int cs_init __P((SCR *, VCS *));
|
|
*/
|
|
int
|
|
cs_init(SCR *sp, VCS *csp)
|
|
{
|
|
int isempty;
|
|
|
|
if (db_eget(sp, csp->cs_lno, &csp->cs_bp, &csp->cs_len, &isempty)) {
|
|
if (isempty)
|
|
msgq(sp, M_BERR, "177|Empty file");
|
|
return (1);
|
|
}
|
|
if (csp->cs_len == 0 || v_isempty(csp->cs_bp, csp->cs_len)) {
|
|
csp->cs_cno = 0;
|
|
csp->cs_flags = CS_EMP;
|
|
} else {
|
|
csp->cs_flags = 0;
|
|
csp->cs_ch = csp->cs_bp[csp->cs_cno];
|
|
}
|
|
return (0);
|
|
}
|
|
|
|
/*
|
|
* cs_next --
|
|
* Retrieve the next character.
|
|
*
|
|
* PUBLIC: int cs_next __P((SCR *, VCS *));
|
|
*/
|
|
int
|
|
cs_next(SCR *sp, VCS *csp)
|
|
{
|
|
CHAR_T *p;
|
|
|
|
switch (csp->cs_flags) {
|
|
case CS_EMP: /* EMP; get next line. */
|
|
case CS_EOL: /* EOL; get next line. */
|
|
if (db_get(sp, ++csp->cs_lno, 0, &p, &csp->cs_len)) {
|
|
--csp->cs_lno;
|
|
csp->cs_flags = CS_EOF;
|
|
} else {
|
|
csp->cs_bp = p;
|
|
if (csp->cs_len == 0 ||
|
|
v_isempty(csp->cs_bp, csp->cs_len)) {
|
|
csp->cs_cno = 0;
|
|
csp->cs_flags = CS_EMP;
|
|
} else {
|
|
csp->cs_flags = 0;
|
|
csp->cs_ch = csp->cs_bp[csp->cs_cno = 0];
|
|
}
|
|
}
|
|
break;
|
|
case 0:
|
|
if (csp->cs_cno == csp->cs_len - 1)
|
|
csp->cs_flags = CS_EOL;
|
|
else
|
|
csp->cs_ch = csp->cs_bp[++csp->cs_cno];
|
|
break;
|
|
case CS_EOF: /* EOF. */
|
|
break;
|
|
default:
|
|
abort();
|
|
/* NOTREACHED */
|
|
}
|
|
return (0);
|
|
}
|
|
|
|
/*
|
|
* cs_fspace --
|
|
* If on a space, eat forward until something other than a
|
|
* whitespace character.
|
|
*
|
|
* XXX
|
|
* Semantics of checking the current character were coded for the fword()
|
|
* function -- once the other word routines are converted, they may have
|
|
* to change.
|
|
*
|
|
* PUBLIC: int cs_fspace __P((SCR *, VCS *));
|
|
*/
|
|
int
|
|
cs_fspace(SCR *sp, VCS *csp)
|
|
{
|
|
if (csp->cs_flags != 0 || !ISBLANK(csp->cs_ch))
|
|
return (0);
|
|
for (;;) {
|
|
if (cs_next(sp, csp))
|
|
return (1);
|
|
if (csp->cs_flags != 0 || !ISBLANK(csp->cs_ch))
|
|
break;
|
|
}
|
|
return (0);
|
|
}
|
|
|
|
/*
|
|
* cs_fblank --
|
|
* Eat forward to the next non-whitespace character.
|
|
*
|
|
* PUBLIC: int cs_fblank __P((SCR *, VCS *));
|
|
*/
|
|
int
|
|
cs_fblank(SCR *sp, VCS *csp)
|
|
{
|
|
for (;;) {
|
|
if (cs_next(sp, csp))
|
|
return (1);
|
|
if (csp->cs_flags == CS_EOL || csp->cs_flags == CS_EMP ||
|
|
(csp->cs_flags == 0 && ISBLANK(csp->cs_ch)))
|
|
continue;
|
|
break;
|
|
}
|
|
return (0);
|
|
}
|
|
|
|
/*
|
|
* cs_prev --
|
|
* Retrieve the previous character.
|
|
*
|
|
* PUBLIC: int cs_prev __P((SCR *, VCS *));
|
|
*/
|
|
int
|
|
cs_prev(SCR *sp, VCS *csp)
|
|
{
|
|
switch (csp->cs_flags) {
|
|
case CS_EMP: /* EMP; get previous line. */
|
|
case CS_EOL: /* EOL; get previous line. */
|
|
if (csp->cs_lno == 1) { /* SOF. */
|
|
csp->cs_flags = CS_SOF;
|
|
break;
|
|
}
|
|
if (db_get(sp, /* The line should exist. */
|
|
--csp->cs_lno, DBG_FATAL, &csp->cs_bp, &csp->cs_len)) {
|
|
++csp->cs_lno;
|
|
return (1);
|
|
}
|
|
if (csp->cs_len == 0 || v_isempty(csp->cs_bp, csp->cs_len)) {
|
|
csp->cs_cno = 0;
|
|
csp->cs_flags = CS_EMP;
|
|
} else {
|
|
csp->cs_flags = 0;
|
|
csp->cs_cno = csp->cs_len - 1;
|
|
csp->cs_ch = csp->cs_bp[csp->cs_cno];
|
|
}
|
|
break;
|
|
case CS_EOF: /* EOF: get previous char. */
|
|
case 0:
|
|
if (csp->cs_cno == 0)
|
|
if (csp->cs_lno == 1)
|
|
csp->cs_flags = CS_SOF;
|
|
else
|
|
csp->cs_flags = CS_EOL;
|
|
else
|
|
csp->cs_ch = csp->cs_bp[--csp->cs_cno];
|
|
break;
|
|
case CS_SOF: /* SOF. */
|
|
break;
|
|
default:
|
|
abort();
|
|
/* NOTREACHED */
|
|
}
|
|
return (0);
|
|
}
|
|
|
|
/*
|
|
* cs_bblank --
|
|
* Eat backward to the next non-whitespace character.
|
|
*
|
|
* PUBLIC: int cs_bblank __P((SCR *, VCS *));
|
|
*/
|
|
int
|
|
cs_bblank(SCR *sp, VCS *csp)
|
|
{
|
|
for (;;) {
|
|
if (cs_prev(sp, csp))
|
|
return (1);
|
|
if (csp->cs_flags == CS_EOL || csp->cs_flags == CS_EMP ||
|
|
(csp->cs_flags == 0 && ISBLANK(csp->cs_ch)))
|
|
continue;
|
|
break;
|
|
}
|
|
return (0);
|
|
}
|