xref: /freebsd/contrib/less/line.c (revision 720c436c669bf5f7405777dcd50575bf6651e0f8)
11d5cfebaSTim J. Robbins /* $FreeBSD$ */
2a5f0fb15SPaul Saab /*
3720c436cSXin LI  * Copyright (C) 1984-2007  Mark Nudelman
4a5f0fb15SPaul Saab  *
5a5f0fb15SPaul Saab  * You may distribute under the terms of either the GNU General Public
6a5f0fb15SPaul Saab  * License or the Less License, as specified in the README file.
7a5f0fb15SPaul Saab  *
8a5f0fb15SPaul Saab  * For more information about less, or for information on how to
9a5f0fb15SPaul Saab  * contact the author, see the README file.
10a5f0fb15SPaul Saab  */
11a5f0fb15SPaul Saab 
12a5f0fb15SPaul Saab 
13a5f0fb15SPaul Saab /*
14a5f0fb15SPaul Saab  * Routines to manipulate the "line buffer".
15a5f0fb15SPaul Saab  * The line buffer holds a line of output as it is being built
16a5f0fb15SPaul Saab  * in preparation for output to the screen.
17a5f0fb15SPaul Saab  */
18a5f0fb15SPaul Saab 
19a5f0fb15SPaul Saab #include "less.h"
2089dd99dcSXin LI #include "charset.h"
21a5f0fb15SPaul Saab 
2289dd99dcSXin LI static char *linebuf = NULL;	/* Buffer which holds the current output line */
23c9346414SPaul Saab static char *attr = NULL;	/* Extension of linebuf to hold attributes */
24c9346414SPaul Saab public int size_linebuf = 0;	/* Size of line buffer (and attr buffer) */
25a5f0fb15SPaul Saab 
2689dd99dcSXin LI static int cshift;		/* Current left-shift of output line buffer */
27a5f0fb15SPaul Saab public int hshift;		/* Desired left-shift of output line buffer */
28c9346414SPaul Saab public int tabstops[TABSTOP_MAX] = { 0 }; /* Custom tabstops */
29c9346414SPaul Saab public int ntabstops = 1;	/* Number of tabstops */
30c9346414SPaul Saab public int tabdefault = 8;	/* Default repeated tabstops */
31a5f0fb15SPaul Saab 
32a5f0fb15SPaul Saab static int curr;		/* Index into linebuf */
33a5f0fb15SPaul Saab static int column;		/* Printable length, accounting for
34a5f0fb15SPaul Saab 				   backspaces, etc. */
35a5f0fb15SPaul Saab static int overstrike;		/* Next char should overstrike previous char */
36000ba3e8STim J. Robbins static int last_overstrike = AT_NORMAL;
37a5f0fb15SPaul Saab static int is_null_line;	/* There is no current line */
388ed69c6fSPaul Saab static int lmargin;		/* Left margin */
3989dd99dcSXin LI static int line_matches;	/* Number of search matches in this line */
40a5f0fb15SPaul Saab static char pendc;
41a5f0fb15SPaul Saab static POSITION pendpos;
42a5f0fb15SPaul Saab static char *end_ansi_chars;
4389dd99dcSXin LI static char *mid_ansi_chars;
44a5f0fb15SPaul Saab 
4589dd99dcSXin LI static int attr_swidth();
4689dd99dcSXin LI static int attr_ewidth();
47a5f0fb15SPaul Saab static int do_append();
48a5f0fb15SPaul Saab 
4989dd99dcSXin LI extern int sigs;
50a5f0fb15SPaul Saab extern int bs_mode;
51a5f0fb15SPaul Saab extern int linenums;
52a5f0fb15SPaul Saab extern int ctldisp;
53a5f0fb15SPaul Saab extern int twiddle;
54a5f0fb15SPaul Saab extern int binattr;
558ed69c6fSPaul Saab extern int status_col;
56a5f0fb15SPaul Saab extern int auto_wrap, ignaw;
57a5f0fb15SPaul Saab extern int bo_s_width, bo_e_width;
58a5f0fb15SPaul Saab extern int ul_s_width, ul_e_width;
59a5f0fb15SPaul Saab extern int bl_s_width, bl_e_width;
60a5f0fb15SPaul Saab extern int so_s_width, so_e_width;
61a5f0fb15SPaul Saab extern int sc_width, sc_height;
62a5f0fb15SPaul Saab extern int utf_mode;
63720c436cSXin LI extern int oldbot;
648ed69c6fSPaul Saab extern POSITION start_attnpos;
658ed69c6fSPaul Saab extern POSITION end_attnpos;
66a5f0fb15SPaul Saab 
6789dd99dcSXin LI static char mbc_buf[MAX_UTF_CHAR_LEN];
6889dd99dcSXin LI static int mbc_buf_len = 0;
6989dd99dcSXin LI static int mbc_buf_index = 0;
7089dd99dcSXin LI static POSITION mbc_pos;
7189dd99dcSXin LI 
72a5f0fb15SPaul Saab /*
73a5f0fb15SPaul Saab  * Initialize from environment variables.
74a5f0fb15SPaul Saab  */
75a5f0fb15SPaul Saab 	public void
76a5f0fb15SPaul Saab init_line()
77a5f0fb15SPaul Saab {
78a5f0fb15SPaul Saab 	end_ansi_chars = lgetenv("LESSANSIENDCHARS");
79a5f0fb15SPaul Saab 	if (end_ansi_chars == NULL || *end_ansi_chars == '\0')
80a5f0fb15SPaul Saab 		end_ansi_chars = "m";
8189dd99dcSXin LI 
8289dd99dcSXin LI 	mid_ansi_chars = lgetenv("LESSANSIMIDCHARS");
8389dd99dcSXin LI 	if (mid_ansi_chars == NULL || *mid_ansi_chars == '\0')
8489dd99dcSXin LI 		mid_ansi_chars = "0123456789;[?!\"'#%()*+ ";
8589dd99dcSXin LI 
86c9346414SPaul Saab 	linebuf = (char *) ecalloc(LINEBUF_SIZE, sizeof(char));
87c9346414SPaul Saab 	attr = (char *) ecalloc(LINEBUF_SIZE, sizeof(char));
88c9346414SPaul Saab 	size_linebuf = LINEBUF_SIZE;
89c9346414SPaul Saab }
90c9346414SPaul Saab 
91c9346414SPaul Saab /*
92c9346414SPaul Saab  * Expand the line buffer.
93c9346414SPaul Saab  */
94c9346414SPaul Saab 	static int
95c9346414SPaul Saab expand_linebuf()
96c9346414SPaul Saab {
9789dd99dcSXin LI 	/* Double the size of the line buffer. */
9889dd99dcSXin LI 	int new_size = size_linebuf * 2;
9989dd99dcSXin LI 
10089dd99dcSXin LI 	/* Just realloc to expand the buffer, if we can. */
10189dd99dcSXin LI #if HAVE_REALLOC
10289dd99dcSXin LI 	char *new_buf = (char *) realloc(linebuf, new_size);
10389dd99dcSXin LI 	char *new_attr = (char *) realloc(attr, new_size);
10489dd99dcSXin LI #else
105c9346414SPaul Saab 	char *new_buf = (char *) calloc(new_size, sizeof(char));
106c9346414SPaul Saab 	char *new_attr = (char *) calloc(new_size, sizeof(char));
10789dd99dcSXin LI #endif
108c9346414SPaul Saab 	if (new_buf == NULL || new_attr == NULL)
109c9346414SPaul Saab 	{
110c9346414SPaul Saab 		if (new_attr != NULL)
111c9346414SPaul Saab 			free(new_attr);
112c9346414SPaul Saab 		if (new_buf != NULL)
113c9346414SPaul Saab 			free(new_buf);
114c9346414SPaul Saab 		return 1;
115c9346414SPaul Saab 	}
11689dd99dcSXin LI #if HAVE_REALLOC
11789dd99dcSXin LI 	/*
11889dd99dcSXin LI 	 * We realloc'd the buffers; they already have the old contents.
11989dd99dcSXin LI 	 */
12089dd99dcSXin LI 	#if 0
12189dd99dcSXin LI 	memset(new_buf + size_linebuf, 0, new_size - size_linebuf);
12289dd99dcSXin LI 	memset(new_attr + size_linebuf, 0, new_size - size_linebuf);
12389dd99dcSXin LI 	#endif
12489dd99dcSXin LI #else
12589dd99dcSXin LI 	/*
12689dd99dcSXin LI 	 * We just calloc'd the buffers; copy the old contents.
12789dd99dcSXin LI 	 */
128c9346414SPaul Saab 	memcpy(new_buf, linebuf, size_linebuf * sizeof(char));
129c9346414SPaul Saab 	memcpy(new_attr, attr, size_linebuf * sizeof(char));
130000ba3e8STim J. Robbins 	free(attr);
131000ba3e8STim J. Robbins 	free(linebuf);
13289dd99dcSXin LI #endif
133c9346414SPaul Saab 	linebuf = new_buf;
134c9346414SPaul Saab 	attr = new_attr;
135c9346414SPaul Saab 	size_linebuf = new_size;
136c9346414SPaul Saab 	return 0;
137a5f0fb15SPaul Saab }
138a5f0fb15SPaul Saab 
139a5f0fb15SPaul Saab /*
14089dd99dcSXin LI  * Is a character ASCII?
14189dd99dcSXin LI  */
14289dd99dcSXin LI 	public int
14389dd99dcSXin LI is_ascii_char(ch)
14489dd99dcSXin LI 	LWCHAR ch;
14589dd99dcSXin LI {
14689dd99dcSXin LI 	return (ch <= 0x7F);
14789dd99dcSXin LI }
14889dd99dcSXin LI 
14989dd99dcSXin LI /*
150a5f0fb15SPaul Saab  * Rewind the line buffer.
151a5f0fb15SPaul Saab  */
152a5f0fb15SPaul Saab 	public void
153a5f0fb15SPaul Saab prewind()
154a5f0fb15SPaul Saab {
155a5f0fb15SPaul Saab 	curr = 0;
156a5f0fb15SPaul Saab 	column = 0;
15789dd99dcSXin LI 	cshift = 0;
158a5f0fb15SPaul Saab 	overstrike = 0;
15989dd99dcSXin LI 	last_overstrike = AT_NORMAL;
16089dd99dcSXin LI 	mbc_buf_len = 0;
161a5f0fb15SPaul Saab 	is_null_line = 0;
162a5f0fb15SPaul Saab 	pendc = '\0';
1638ed69c6fSPaul Saab 	lmargin = 0;
164000ba3e8STim J. Robbins 	if (status_col)
165000ba3e8STim J. Robbins 		lmargin += 1;
166c9346414SPaul Saab #if HILITE_SEARCH
16789dd99dcSXin LI 	line_matches = 0;
168c9346414SPaul Saab #endif
169a5f0fb15SPaul Saab }
170a5f0fb15SPaul Saab 
171a5f0fb15SPaul Saab /*
172a5f0fb15SPaul Saab  * Insert the line number (of the given position) into the line buffer.
173a5f0fb15SPaul Saab  */
174a5f0fb15SPaul Saab 	public void
175a5f0fb15SPaul Saab plinenum(pos)
176a5f0fb15SPaul Saab 	POSITION pos;
177a5f0fb15SPaul Saab {
178000ba3e8STim J. Robbins 	register LINENUM linenum = 0;
179a5f0fb15SPaul Saab 	register int i;
180a5f0fb15SPaul Saab 
1818ed69c6fSPaul Saab 	if (linenums == OPT_ONPLUS)
1828ed69c6fSPaul Saab 	{
183a5f0fb15SPaul Saab 		/*
184a5f0fb15SPaul Saab 		 * Get the line number and put it in the current line.
185a5f0fb15SPaul Saab 		 * {{ Note: since find_linenum calls forw_raw_line,
186a5f0fb15SPaul Saab 		 *    it may seek in the input file, requiring the caller
187a5f0fb15SPaul Saab 		 *    of plinenum to re-seek if necessary. }}
1888ed69c6fSPaul Saab 		 * {{ Since forw_raw_line modifies linebuf, we must
1898ed69c6fSPaul Saab 		 *    do this first, before storing anything in linebuf. }}
190a5f0fb15SPaul Saab 		 */
191000ba3e8STim J. Robbins 		linenum = find_linenum(pos);
1928ed69c6fSPaul Saab 	}
193a5f0fb15SPaul Saab 
194a5f0fb15SPaul Saab 	/*
1958ed69c6fSPaul Saab 	 * Display a status column if the -J option is set.
196a5f0fb15SPaul Saab 	 */
1978ed69c6fSPaul Saab 	if (status_col)
1988ed69c6fSPaul Saab 	{
1998ed69c6fSPaul Saab 		linebuf[curr] = ' ';
2008ed69c6fSPaul Saab 		if (start_attnpos != NULL_POSITION &&
2018ed69c6fSPaul Saab 		    pos >= start_attnpos && pos < end_attnpos)
20289dd99dcSXin LI 			attr[curr] = AT_NORMAL|AT_HILITE;
2038ed69c6fSPaul Saab 		else
20489dd99dcSXin LI 			attr[curr] = AT_NORMAL;
2058ed69c6fSPaul Saab 		curr++;
2068ed69c6fSPaul Saab 		column++;
2078ed69c6fSPaul Saab 	}
2088ed69c6fSPaul Saab 	/*
2098ed69c6fSPaul Saab 	 * Display the line number at the start of each line
2108ed69c6fSPaul Saab 	 * if the -N option is set.
2118ed69c6fSPaul Saab 	 */
2128ed69c6fSPaul Saab 	if (linenums == OPT_ONPLUS)
2138ed69c6fSPaul Saab 	{
214000ba3e8STim J. Robbins 		char buf[INT_STRLEN_BOUND(pos) + 2];
215000ba3e8STim J. Robbins 		int n;
216000ba3e8STim J. Robbins 
217000ba3e8STim J. Robbins 		linenumtoa(linenum, buf);
218000ba3e8STim J. Robbins 		n = strlen(buf);
219000ba3e8STim J. Robbins 		if (n < MIN_LINENUM_WIDTH)
220000ba3e8STim J. Robbins 			n = MIN_LINENUM_WIDTH;
221000ba3e8STim J. Robbins 		sprintf(linebuf+curr, "%*s ", n, buf);
222000ba3e8STim J. Robbins 		n++;  /* One space after the line number. */
223000ba3e8STim J. Robbins 		for (i = 0; i < n; i++)
224000ba3e8STim J. Robbins 			attr[curr+i] = AT_NORMAL;
225000ba3e8STim J. Robbins 		curr += n;
226000ba3e8STim J. Robbins 		column += n;
227000ba3e8STim J. Robbins 		lmargin += n;
2288ed69c6fSPaul Saab 	}
229000ba3e8STim J. Robbins 
2308ed69c6fSPaul Saab 	/*
2318ed69c6fSPaul Saab 	 * Append enough spaces to bring us to the lmargin.
2328ed69c6fSPaul Saab 	 */
2338ed69c6fSPaul Saab 	while (column < lmargin)
234a5f0fb15SPaul Saab 	{
235a5f0fb15SPaul Saab 		linebuf[curr] = ' ';
236a5f0fb15SPaul Saab 		attr[curr++] = AT_NORMAL;
237a5f0fb15SPaul Saab 		column++;
2388ed69c6fSPaul Saab 	}
239a5f0fb15SPaul Saab }
240a5f0fb15SPaul Saab 
241a5f0fb15SPaul Saab /*
242a5f0fb15SPaul Saab  * Shift the input line left.
243a5f0fb15SPaul Saab  * This means discarding N printable chars at the start of the buffer.
244a5f0fb15SPaul Saab  */
245a5f0fb15SPaul Saab 	static void
246a5f0fb15SPaul Saab pshift(shift)
247a5f0fb15SPaul Saab 	int shift;
248a5f0fb15SPaul Saab {
24989dd99dcSXin LI 	LWCHAR prev_ch = 0;
25089dd99dcSXin LI 	unsigned char c;
25189dd99dcSXin LI 	int shifted = 0;
25289dd99dcSXin LI 	int to;
25389dd99dcSXin LI 	int from;
25489dd99dcSXin LI 	int len;
25589dd99dcSXin LI 	int width;
25689dd99dcSXin LI 	int prev_attr;
25789dd99dcSXin LI 	int next_attr;
258a5f0fb15SPaul Saab 
2598ed69c6fSPaul Saab 	if (shift > column - lmargin)
2608ed69c6fSPaul Saab 		shift = column - lmargin;
2618ed69c6fSPaul Saab 	if (shift > curr - lmargin)
2628ed69c6fSPaul Saab 		shift = curr - lmargin;
263a5f0fb15SPaul Saab 
26489dd99dcSXin LI 	to = from = lmargin;
26589dd99dcSXin LI 	/*
26689dd99dcSXin LI 	 * We keep on going when shifted == shift
26789dd99dcSXin LI 	 * to get all combining chars.
26889dd99dcSXin LI 	 */
26989dd99dcSXin LI 	while (shifted <= shift && from < curr)
270a5f0fb15SPaul Saab 	{
27189dd99dcSXin LI 		c = linebuf[from];
27289dd99dcSXin LI 		if (c == ESC && ctldisp == OPT_ONPLUS)
27389dd99dcSXin LI 		{
27489dd99dcSXin LI 			/* Keep cumulative effect.  */
27589dd99dcSXin LI 			linebuf[to] = c;
27689dd99dcSXin LI 			attr[to++] = attr[from++];
27789dd99dcSXin LI 			while (from < curr && linebuf[from])
27889dd99dcSXin LI 			{
27989dd99dcSXin LI 				linebuf[to] = linebuf[from];
28089dd99dcSXin LI 				attr[to++] = attr[from];
28189dd99dcSXin LI 				if (!is_ansi_middle(linebuf[from++]))
28289dd99dcSXin LI 					break;
283a5f0fb15SPaul Saab 			}
28489dd99dcSXin LI 			continue;
28589dd99dcSXin LI 		}
28689dd99dcSXin LI 
28789dd99dcSXin LI 		width = 0;
28889dd99dcSXin LI 
28989dd99dcSXin LI 		if (!IS_ASCII_OCTET(c) && utf_mode)
29089dd99dcSXin LI 		{
29189dd99dcSXin LI 			/* Assumes well-formedness validation already done.  */
29289dd99dcSXin LI 			LWCHAR ch;
29389dd99dcSXin LI 
29489dd99dcSXin LI 			len = utf_len(c);
29589dd99dcSXin LI 			if (from + len > curr)
29689dd99dcSXin LI 				break;
29789dd99dcSXin LI 			ch = get_wchar(linebuf + from);
29889dd99dcSXin LI 			if (!is_composing_char(ch) && !is_combining_char(prev_ch, ch))
29989dd99dcSXin LI 				width = is_wide_char(ch) ? 2 : 1;
30089dd99dcSXin LI 			prev_ch = ch;
30189dd99dcSXin LI 		} else
30289dd99dcSXin LI 		{
30389dd99dcSXin LI 			len = 1;
30489dd99dcSXin LI 			if (c == '\b')
30589dd99dcSXin LI 				/* XXX - Incorrect if several '\b' in a row.  */
30689dd99dcSXin LI 				width = (utf_mode && is_wide_char(prev_ch)) ? -2 : -1;
30789dd99dcSXin LI 			else if (!control_char(c))
30889dd99dcSXin LI 				width = 1;
30989dd99dcSXin LI 			prev_ch = 0;
31089dd99dcSXin LI 		}
31189dd99dcSXin LI 
31289dd99dcSXin LI 		if (width == 2 && shift - shifted == 1) {
31389dd99dcSXin LI 			/* Should never happen when called by pshift_all().  */
31489dd99dcSXin LI 			attr[to] = attr[from];
31589dd99dcSXin LI 			/*
31689dd99dcSXin LI 			 * Assume a wide_char will never be the first half of a
31789dd99dcSXin LI 			 * combining_char pair, so reset prev_ch in case we're
31889dd99dcSXin LI 			 * followed by a '\b'.
31989dd99dcSXin LI 			 */
32089dd99dcSXin LI 			prev_ch = linebuf[to++] = ' ';
32189dd99dcSXin LI 			from += len;
32289dd99dcSXin LI 			shifted++;
32389dd99dcSXin LI 			continue;
32489dd99dcSXin LI 		}
32589dd99dcSXin LI 
32689dd99dcSXin LI 		/* Adjust width for magic cookies. */
32789dd99dcSXin LI 		prev_attr = (to > 0) ? attr[to-1] : AT_NORMAL;
32889dd99dcSXin LI 		next_attr = (from + len < curr) ? attr[from + len] : prev_attr;
32989dd99dcSXin LI 		if (!is_at_equiv(attr[from], prev_attr) &&
33089dd99dcSXin LI 			!is_at_equiv(attr[from], next_attr))
33189dd99dcSXin LI 		{
33289dd99dcSXin LI 			width += attr_swidth(attr[from]);
33389dd99dcSXin LI 			if (from + len < curr)
33489dd99dcSXin LI 				width += attr_ewidth(attr[from]);
33589dd99dcSXin LI 			if (is_at_equiv(prev_attr, next_attr))
33689dd99dcSXin LI 			{
33789dd99dcSXin LI 				width += attr_ewidth(prev_attr);
33889dd99dcSXin LI 				if (from + len < curr)
33989dd99dcSXin LI 					width += attr_swidth(next_attr);
34089dd99dcSXin LI 			}
34189dd99dcSXin LI 		}
34289dd99dcSXin LI 
34389dd99dcSXin LI 		if (shift - shifted < width)
34489dd99dcSXin LI 			break;
34589dd99dcSXin LI 		from += len;
34689dd99dcSXin LI 		shifted += width;
34789dd99dcSXin LI 		if (shifted < 0)
34889dd99dcSXin LI 			shifted = 0;
34989dd99dcSXin LI 	}
35089dd99dcSXin LI 	while (from < curr)
35189dd99dcSXin LI 	{
35289dd99dcSXin LI 		linebuf[to] = linebuf[from];
35389dd99dcSXin LI 		attr[to++] = attr[from++];
35489dd99dcSXin LI 	}
35589dd99dcSXin LI 	curr = to;
35689dd99dcSXin LI 	column -= shifted;
35789dd99dcSXin LI 	cshift += shifted;
35889dd99dcSXin LI }
35989dd99dcSXin LI 
36089dd99dcSXin LI /*
36189dd99dcSXin LI  *
36289dd99dcSXin LI  */
36389dd99dcSXin LI 	public void
36489dd99dcSXin LI pshift_all()
36589dd99dcSXin LI {
36689dd99dcSXin LI 	pshift(column);
367a5f0fb15SPaul Saab }
368a5f0fb15SPaul Saab 
369a5f0fb15SPaul Saab /*
370a5f0fb15SPaul Saab  * Return the printing width of the start (enter) sequence
371a5f0fb15SPaul Saab  * for a given character attribute.
372a5f0fb15SPaul Saab  */
373a5f0fb15SPaul Saab 	static int
374a5f0fb15SPaul Saab attr_swidth(a)
375a5f0fb15SPaul Saab 	int a;
376a5f0fb15SPaul Saab {
37789dd99dcSXin LI 	int w = 0;
37889dd99dcSXin LI 
37989dd99dcSXin LI 	a = apply_at_specials(a);
38089dd99dcSXin LI 
38189dd99dcSXin LI 	if (a & AT_UNDERLINE)
38289dd99dcSXin LI 		w += ul_s_width;
38389dd99dcSXin LI 	if (a & AT_BOLD)
38489dd99dcSXin LI 		w += bo_s_width;
38589dd99dcSXin LI 	if (a & AT_BLINK)
38689dd99dcSXin LI 		w += bl_s_width;
38789dd99dcSXin LI 	if (a & AT_STANDOUT)
38889dd99dcSXin LI 		w += so_s_width;
38989dd99dcSXin LI 
39089dd99dcSXin LI 	return w;
391a5f0fb15SPaul Saab }
392a5f0fb15SPaul Saab 
393a5f0fb15SPaul Saab /*
394a5f0fb15SPaul Saab  * Return the printing width of the end (exit) sequence
395a5f0fb15SPaul Saab  * for a given character attribute.
396a5f0fb15SPaul Saab  */
397a5f0fb15SPaul Saab 	static int
398a5f0fb15SPaul Saab attr_ewidth(a)
399a5f0fb15SPaul Saab 	int a;
400a5f0fb15SPaul Saab {
40189dd99dcSXin LI 	int w = 0;
40289dd99dcSXin LI 
40389dd99dcSXin LI 	a = apply_at_specials(a);
40489dd99dcSXin LI 
40589dd99dcSXin LI 	if (a & AT_UNDERLINE)
40689dd99dcSXin LI 		w += ul_e_width;
40789dd99dcSXin LI 	if (a & AT_BOLD)
40889dd99dcSXin LI 		w += bo_e_width;
40989dd99dcSXin LI 	if (a & AT_BLINK)
41089dd99dcSXin LI 		w += bl_e_width;
41189dd99dcSXin LI 	if (a & AT_STANDOUT)
41289dd99dcSXin LI 		w += so_e_width;
41389dd99dcSXin LI 
41489dd99dcSXin LI 	return w;
415a5f0fb15SPaul Saab }
416a5f0fb15SPaul Saab 
417a5f0fb15SPaul Saab /*
418a5f0fb15SPaul Saab  * Return the printing width of a given character and attribute,
419a5f0fb15SPaul Saab  * if the character were added to the current position in the line buffer.
420a5f0fb15SPaul Saab  * Adding a character with a given attribute may cause an enter or exit
421a5f0fb15SPaul Saab  * attribute sequence to be inserted, so this must be taken into account.
422a5f0fb15SPaul Saab  */
423a5f0fb15SPaul Saab 	static int
42489dd99dcSXin LI pwidth(ch, a, prev_ch)
42589dd99dcSXin LI 	LWCHAR ch;
426a5f0fb15SPaul Saab 	int a;
42789dd99dcSXin LI 	LWCHAR prev_ch;
428a5f0fb15SPaul Saab {
42989dd99dcSXin LI 	int w;
430a5f0fb15SPaul Saab 
43189dd99dcSXin LI 	if (ch == '\b')
432a5f0fb15SPaul Saab 		/*
43389dd99dcSXin LI 		 * Backspace moves backwards one or two positions.
43489dd99dcSXin LI 		 * XXX - Incorrect if several '\b' in a row.
435a5f0fb15SPaul Saab 		 */
43689dd99dcSXin LI 		return (utf_mode && is_wide_char(prev_ch)) ? -2 : -1;
437a5f0fb15SPaul Saab 
43889dd99dcSXin LI 	if (!utf_mode || is_ascii_char(ch))
43989dd99dcSXin LI 	{
44089dd99dcSXin LI 		if (control_char((char)ch))
44189dd99dcSXin LI 		{
442a5f0fb15SPaul Saab 			/*
44389dd99dcSXin LI 			 * Control characters do unpredictable things,
444a5f0fb15SPaul Saab 			 * so we don't even try to guess; say it doesn't move.
445a5f0fb15SPaul Saab 			 * This can only happen if the -r flag is in effect.
446a5f0fb15SPaul Saab 			 */
447a5f0fb15SPaul Saab 			return (0);
44889dd99dcSXin LI 		}
44989dd99dcSXin LI 	} else
45089dd99dcSXin LI 	{
45189dd99dcSXin LI 		if (is_composing_char(ch) || is_combining_char(prev_ch, ch))
45289dd99dcSXin LI 		{
45389dd99dcSXin LI 			/*
45489dd99dcSXin LI 			 * Composing and combining chars take up no space.
45589dd99dcSXin LI 			 *
45689dd99dcSXin LI 			 * Some terminals, upon failure to compose a
45789dd99dcSXin LI 			 * composing character with the character(s) that
45889dd99dcSXin LI 			 * precede(s) it will actually take up one column
45989dd99dcSXin LI 			 * for the composing character; there isn't much
46089dd99dcSXin LI 			 * we could do short of testing the (complex)
46189dd99dcSXin LI 			 * composition process ourselves and printing
46289dd99dcSXin LI 			 * a binary representation when it fails.
46389dd99dcSXin LI 			 */
46489dd99dcSXin LI 			return (0);
46589dd99dcSXin LI 		}
46689dd99dcSXin LI 	}
467a5f0fb15SPaul Saab 
468a5f0fb15SPaul Saab 	/*
46989dd99dcSXin LI 	 * Other characters take one or two columns,
470a5f0fb15SPaul Saab 	 * plus the width of any attribute enter/exit sequence.
471a5f0fb15SPaul Saab 	 */
472a5f0fb15SPaul Saab 	w = 1;
47389dd99dcSXin LI 	if (is_wide_char(ch))
47489dd99dcSXin LI 		w++;
47589dd99dcSXin LI 	if (curr > 0 && !is_at_equiv(attr[curr-1], a))
476a5f0fb15SPaul Saab 		w += attr_ewidth(attr[curr-1]);
47789dd99dcSXin LI 	if ((apply_at_specials(a) != AT_NORMAL) &&
47889dd99dcSXin LI 	    (curr == 0 || !is_at_equiv(attr[curr-1], a)))
479a5f0fb15SPaul Saab 		w += attr_swidth(a);
480a5f0fb15SPaul Saab 	return (w);
481a5f0fb15SPaul Saab }
482a5f0fb15SPaul Saab 
483a5f0fb15SPaul Saab /*
48489dd99dcSXin LI  * Delete to the previous base character in the line buffer.
48589dd99dcSXin LI  * Return 1 if one is found.
486a5f0fb15SPaul Saab  */
48789dd99dcSXin LI 	static int
488a5f0fb15SPaul Saab backc()
489a5f0fb15SPaul Saab {
49089dd99dcSXin LI 	LWCHAR prev_ch;
49189dd99dcSXin LI 	char *p = linebuf + curr;
49289dd99dcSXin LI 	LWCHAR ch = step_char(&p, -1, linebuf + lmargin);
49389dd99dcSXin LI 	int width;
49489dd99dcSXin LI 
49589dd99dcSXin LI 	/* This assumes that there is no '\b' in linebuf.  */
49689dd99dcSXin LI 	while (   curr > lmargin
49789dd99dcSXin LI 	       && column > lmargin
49889dd99dcSXin LI 	       && (!(attr[curr - 1] & (AT_ANSI|AT_BINARY))))
49989dd99dcSXin LI 	{
50089dd99dcSXin LI 		curr = p - linebuf;
50189dd99dcSXin LI 		prev_ch = step_char(&p, -1, linebuf + lmargin);
50289dd99dcSXin LI 		width = pwidth(ch, attr[curr], prev_ch);
50389dd99dcSXin LI 		column -= width;
50489dd99dcSXin LI 		if (width > 0)
50589dd99dcSXin LI 			return 1;
50689dd99dcSXin LI 		ch = prev_ch;
50789dd99dcSXin LI 	}
50889dd99dcSXin LI 
50989dd99dcSXin LI 	return 0;
510a5f0fb15SPaul Saab }
511a5f0fb15SPaul Saab 
512a5f0fb15SPaul Saab /*
513a5f0fb15SPaul Saab  * Are we currently within a recognized ANSI escape sequence?
514a5f0fb15SPaul Saab  */
515a5f0fb15SPaul Saab 	static int
516a5f0fb15SPaul Saab in_ansi_esc_seq()
517a5f0fb15SPaul Saab {
51889dd99dcSXin LI 	char *p;
519a5f0fb15SPaul Saab 
520a5f0fb15SPaul Saab 	/*
521a5f0fb15SPaul Saab 	 * Search backwards for either an ESC (which means we ARE in a seq);
522a5f0fb15SPaul Saab 	 * or an end char (which means we're NOT in a seq).
523a5f0fb15SPaul Saab 	 */
52489dd99dcSXin LI 	for (p = &linebuf[curr];  p > linebuf; )
525a5f0fb15SPaul Saab 	{
52689dd99dcSXin LI 		LWCHAR ch = step_char(&p, -1, linebuf);
52789dd99dcSXin LI 		if (ch == ESC)
528a5f0fb15SPaul Saab 			return (1);
52989dd99dcSXin LI 		if (!is_ansi_middle(ch))
530a5f0fb15SPaul Saab 			return (0);
531a5f0fb15SPaul Saab 	}
532a5f0fb15SPaul Saab 	return (0);
533a5f0fb15SPaul Saab }
534a5f0fb15SPaul Saab 
535a5f0fb15SPaul Saab /*
536c9346414SPaul Saab  * Is a character the end of an ANSI escape sequence?
537c9346414SPaul Saab  */
538c9346414SPaul Saab 	public int
53989dd99dcSXin LI is_ansi_end(ch)
54089dd99dcSXin LI 	LWCHAR ch;
541c9346414SPaul Saab {
54289dd99dcSXin LI 	if (!is_ascii_char(ch))
54389dd99dcSXin LI 		return (0);
54489dd99dcSXin LI 	return (strchr(end_ansi_chars, (char) ch) != NULL);
54589dd99dcSXin LI }
54689dd99dcSXin LI 
54789dd99dcSXin LI /*
54889dd99dcSXin LI  *
54989dd99dcSXin LI  */
55089dd99dcSXin LI 	public int
55189dd99dcSXin LI is_ansi_middle(ch)
55289dd99dcSXin LI 	LWCHAR ch;
55389dd99dcSXin LI {
55489dd99dcSXin LI 	if (!is_ascii_char(ch))
55589dd99dcSXin LI 		return (0);
55689dd99dcSXin LI 	if (is_ansi_end(ch))
55789dd99dcSXin LI 		return (0);
55889dd99dcSXin LI 	return (strchr(mid_ansi_chars, (char) ch) != NULL);
559c9346414SPaul Saab }
560c9346414SPaul Saab 
561c9346414SPaul Saab /*
562a5f0fb15SPaul Saab  * Append a character and attribute to the line buffer.
563a5f0fb15SPaul Saab  */
56489dd99dcSXin LI #define	STORE_CHAR(ch,a,rep,pos) \
56589dd99dcSXin LI 	do { \
56689dd99dcSXin LI 		if (store_char((ch),(a),(rep),(pos))) return (1); \
56789dd99dcSXin LI 	} while (0)
568c9346414SPaul Saab 
569a5f0fb15SPaul Saab 	static int
57089dd99dcSXin LI store_char(ch, a, rep, pos)
57189dd99dcSXin LI 	LWCHAR ch;
572a5f0fb15SPaul Saab 	int a;
57389dd99dcSXin LI 	char *rep;
574a5f0fb15SPaul Saab 	POSITION pos;
575a5f0fb15SPaul Saab {
57689dd99dcSXin LI 	int w;
57789dd99dcSXin LI 	int replen;
57889dd99dcSXin LI 	char cs;
579a5f0fb15SPaul Saab 
58089dd99dcSXin LI 	w = (a & (AT_UNDERLINE|AT_BOLD));	/* Pre-use w.  */
58189dd99dcSXin LI 	if (w != AT_NORMAL)
58289dd99dcSXin LI 		last_overstrike = w;
58389dd99dcSXin LI 
584a5f0fb15SPaul Saab #if HILITE_SEARCH
58589dd99dcSXin LI 	{
58689dd99dcSXin LI 		int matches;
58789dd99dcSXin LI 		if (is_hilited(pos, pos+1, 0, &matches))
588c9346414SPaul Saab 		{
589a5f0fb15SPaul Saab 			/*
590a5f0fb15SPaul Saab 			 * This character should be highlighted.
591a5f0fb15SPaul Saab 			 * Override the attribute passed in.
592a5f0fb15SPaul Saab 			 */
59389dd99dcSXin LI 			if (a != AT_ANSI)
59489dd99dcSXin LI 				a |= AT_HILITE;
59589dd99dcSXin LI 		}
59689dd99dcSXin LI 		line_matches += matches;
597c9346414SPaul Saab 	}
598a5f0fb15SPaul Saab #endif
59989dd99dcSXin LI 
600a5f0fb15SPaul Saab 	if (ctldisp == OPT_ONPLUS && in_ansi_esc_seq())
60189dd99dcSXin LI 	{
60289dd99dcSXin LI 		if (!is_ansi_end(ch) && !is_ansi_middle(ch)) {
60389dd99dcSXin LI 			/* Remove whole unrecognized sequence.  */
60489dd99dcSXin LI 			do {
60589dd99dcSXin LI 				--curr;
60689dd99dcSXin LI 			} while (linebuf[curr] != ESC);
60789dd99dcSXin LI 			return 0;
60889dd99dcSXin LI 		}
60989dd99dcSXin LI 		a = AT_ANSI;	/* Will force re-AT_'ing around it.  */
610a5f0fb15SPaul Saab 		w = 0;
61189dd99dcSXin LI 	}
61289dd99dcSXin LI 	else if (ctldisp == OPT_ONPLUS && ch == ESC)
61389dd99dcSXin LI 	{
61489dd99dcSXin LI 		a = AT_ANSI;	/* Will force re-AT_'ing around it.  */
61589dd99dcSXin LI 		w = 0;
61689dd99dcSXin LI 	}
617a5f0fb15SPaul Saab 	else
61889dd99dcSXin LI 	{
61989dd99dcSXin LI 		char *p = &linebuf[curr];
62089dd99dcSXin LI 		LWCHAR prev_ch = step_char(&p, -1, linebuf);
62189dd99dcSXin LI 		w = pwidth(ch, a, prev_ch);
62289dd99dcSXin LI 	}
62389dd99dcSXin LI 
624a5f0fb15SPaul Saab 	if (ctldisp != OPT_ON && column + w + attr_ewidth(a) > sc_width)
625a5f0fb15SPaul Saab 		/*
626a5f0fb15SPaul Saab 		 * Won't fit on screen.
627a5f0fb15SPaul Saab 		 */
628a5f0fb15SPaul Saab 		return (1);
629a5f0fb15SPaul Saab 
63089dd99dcSXin LI 	if (rep == NULL)
63189dd99dcSXin LI 	{
63289dd99dcSXin LI 		cs = (char) ch;
63389dd99dcSXin LI 		rep = &cs;
63489dd99dcSXin LI 		replen = 1;
63589dd99dcSXin LI 	} else
63689dd99dcSXin LI 	{
63789dd99dcSXin LI 		replen = utf_len(rep[0]);
63889dd99dcSXin LI 	}
63989dd99dcSXin LI 	if (curr + replen >= size_linebuf-6)
640c9346414SPaul Saab 	{
641a5f0fb15SPaul Saab 		/*
642a5f0fb15SPaul Saab 		 * Won't fit in line buffer.
643c9346414SPaul Saab 		 * Try to expand it.
644a5f0fb15SPaul Saab 		 */
645c9346414SPaul Saab 		if (expand_linebuf())
646a5f0fb15SPaul Saab 			return (1);
647c9346414SPaul Saab 	}
648a5f0fb15SPaul Saab 
64989dd99dcSXin LI 	while (replen-- > 0)
650a5f0fb15SPaul Saab 	{
65189dd99dcSXin LI 		linebuf[curr] = *rep++;
652a5f0fb15SPaul Saab 		attr[curr] = a;
65389dd99dcSXin LI 		curr++;
65489dd99dcSXin LI 	}
655a5f0fb15SPaul Saab 	column += w;
656a5f0fb15SPaul Saab 	return (0);
657a5f0fb15SPaul Saab }
658a5f0fb15SPaul Saab 
659a5f0fb15SPaul Saab /*
660c9346414SPaul Saab  * Append a tab to the line buffer.
661c9346414SPaul Saab  * Store spaces to represent the tab.
662c9346414SPaul Saab  */
663c9346414SPaul Saab #define	STORE_TAB(a,pos) \
664c9346414SPaul Saab 	do { if (store_tab((a),(pos))) return (1); } while (0)
665c9346414SPaul Saab 
666c9346414SPaul Saab 	static int
667c9346414SPaul Saab store_tab(attr, pos)
668c9346414SPaul Saab 	int attr;
669c9346414SPaul Saab 	POSITION pos;
670c9346414SPaul Saab {
671c9346414SPaul Saab 	int to_tab = column + cshift - lmargin;
672c9346414SPaul Saab 	int i;
673c9346414SPaul Saab 
674c9346414SPaul Saab 	if (ntabstops < 2 || to_tab >= tabstops[ntabstops-1])
675c9346414SPaul Saab 		to_tab = tabdefault -
676c9346414SPaul Saab 		     ((to_tab - tabstops[ntabstops-1]) % tabdefault);
677c9346414SPaul Saab 	else
678c9346414SPaul Saab 	{
679c9346414SPaul Saab 		for (i = ntabstops - 2;  i >= 0;  i--)
680c9346414SPaul Saab 			if (to_tab >= tabstops[i])
681c9346414SPaul Saab 				break;
682c9346414SPaul Saab 		to_tab = tabstops[i+1] - to_tab;
683c9346414SPaul Saab 	}
684c9346414SPaul Saab 
68589dd99dcSXin LI 	if (column + to_tab - 1 + pwidth(' ', attr, 0) + attr_ewidth(attr) > sc_width)
68689dd99dcSXin LI 		return 1;
68789dd99dcSXin LI 
688c9346414SPaul Saab 	do {
68989dd99dcSXin LI 		STORE_CHAR(' ', attr, " ", pos);
690c9346414SPaul Saab 	} while (--to_tab > 0);
691c9346414SPaul Saab 	return 0;
692c9346414SPaul Saab }
693c9346414SPaul Saab 
69489dd99dcSXin LI #define STORE_PRCHAR(c, pos) \
69589dd99dcSXin LI 	do { if (store_prchar((c), (pos))) return 1; } while (0)
69689dd99dcSXin LI 
69789dd99dcSXin LI 	static int
69889dd99dcSXin LI store_prchar(c, pos)
69989dd99dcSXin LI 	char c;
70089dd99dcSXin LI 	POSITION pos;
70189dd99dcSXin LI {
70289dd99dcSXin LI 	char *s;
70389dd99dcSXin LI 
70489dd99dcSXin LI 	/*
70589dd99dcSXin LI 	 * Convert to printable representation.
70689dd99dcSXin LI 	 */
70789dd99dcSXin LI 	s = prchar(c);
70889dd99dcSXin LI 
70989dd99dcSXin LI 	/*
71089dd99dcSXin LI 	 * Make sure we can get the entire representation
71189dd99dcSXin LI 	 * of the character on this line.
71289dd99dcSXin LI 	 */
71389dd99dcSXin LI 	if (column + (int) strlen(s) - 1 +
71489dd99dcSXin LI             pwidth(' ', binattr, 0) + attr_ewidth(binattr) > sc_width)
71589dd99dcSXin LI 		return 1;
71689dd99dcSXin LI 
71789dd99dcSXin LI 	for ( ;  *s != 0;  s++)
71889dd99dcSXin LI 		STORE_CHAR(*s, AT_BINARY, NULL, pos);
71989dd99dcSXin LI 
72089dd99dcSXin LI 	return 0;
72189dd99dcSXin LI }
72289dd99dcSXin LI 
72389dd99dcSXin LI 	static int
72489dd99dcSXin LI flush_mbc_buf(pos)
72589dd99dcSXin LI 	POSITION pos;
72689dd99dcSXin LI {
72789dd99dcSXin LI 	int i;
72889dd99dcSXin LI 
72989dd99dcSXin LI 	for (i = 0; i < mbc_buf_index; i++)
73089dd99dcSXin LI 		if (store_prchar(mbc_buf[i], pos))
73189dd99dcSXin LI 			return mbc_buf_index - i;
73289dd99dcSXin LI 
73389dd99dcSXin LI 	return 0;
73489dd99dcSXin LI }
73589dd99dcSXin LI 
736c9346414SPaul Saab /*
737a5f0fb15SPaul Saab  * Append a character to the line buffer.
738a5f0fb15SPaul Saab  * Expand tabs into spaces, handle underlining, boldfacing, etc.
739a5f0fb15SPaul Saab  * Returns 0 if ok, 1 if couldn't fit in buffer.
740a5f0fb15SPaul Saab  */
741a5f0fb15SPaul Saab 	public int
742a5f0fb15SPaul Saab pappend(c, pos)
74389dd99dcSXin LI 	char c;
744a5f0fb15SPaul Saab 	POSITION pos;
745a5f0fb15SPaul Saab {
746a5f0fb15SPaul Saab 	int r;
747a5f0fb15SPaul Saab 
748a5f0fb15SPaul Saab 	if (pendc)
749a5f0fb15SPaul Saab 	{
75089dd99dcSXin LI 		if (do_append(pendc, NULL, pendpos))
751a5f0fb15SPaul Saab 			/*
752a5f0fb15SPaul Saab 			 * Oops.  We've probably lost the char which
753a5f0fb15SPaul Saab 			 * was in pendc, since caller won't back up.
754a5f0fb15SPaul Saab 			 */
755a5f0fb15SPaul Saab 			return (1);
756a5f0fb15SPaul Saab 		pendc = '\0';
757a5f0fb15SPaul Saab 	}
758a5f0fb15SPaul Saab 
759a5f0fb15SPaul Saab 	if (c == '\r' && bs_mode == BS_SPECIAL)
760a5f0fb15SPaul Saab 	{
76189dd99dcSXin LI 		if (mbc_buf_len > 0)  /* utf_mode must be on. */
76289dd99dcSXin LI 		{
76389dd99dcSXin LI 			/* Flush incomplete (truncated) sequence. */
76489dd99dcSXin LI 			r = flush_mbc_buf(mbc_pos);
76589dd99dcSXin LI 			mbc_buf_index = r + 1;
76689dd99dcSXin LI 			mbc_buf_len = 0;
76789dd99dcSXin LI 			if (r)
76889dd99dcSXin LI 				return (mbc_buf_index);
76989dd99dcSXin LI 		}
77089dd99dcSXin LI 
771a5f0fb15SPaul Saab 		/*
772a5f0fb15SPaul Saab 		 * Don't put the CR into the buffer until we see
773a5f0fb15SPaul Saab 		 * the next char.  If the next char is a newline,
774a5f0fb15SPaul Saab 		 * discard the CR.
775a5f0fb15SPaul Saab 		 */
776a5f0fb15SPaul Saab 		pendc = c;
777a5f0fb15SPaul Saab 		pendpos = pos;
778a5f0fb15SPaul Saab 		return (0);
779a5f0fb15SPaul Saab 	}
780a5f0fb15SPaul Saab 
78189dd99dcSXin LI 	if (!utf_mode)
78289dd99dcSXin LI 	{
78389dd99dcSXin LI 		r = do_append((LWCHAR) c, NULL, pos);
78489dd99dcSXin LI 	} else
78589dd99dcSXin LI 	{
78689dd99dcSXin LI 		/* Perform strict validation in all possible cases. */
78789dd99dcSXin LI 		if (mbc_buf_len == 0)
78889dd99dcSXin LI 		{
78989dd99dcSXin LI 		retry:
79089dd99dcSXin LI 			mbc_buf_index = 1;
79189dd99dcSXin LI 			*mbc_buf = c;
79289dd99dcSXin LI 			if (IS_ASCII_OCTET(c))
79389dd99dcSXin LI 				r = do_append((LWCHAR) c, NULL, pos);
79489dd99dcSXin LI 			else if (IS_UTF8_LEAD(c))
79589dd99dcSXin LI 			{
79689dd99dcSXin LI 				mbc_buf_len = utf_len(c);
79789dd99dcSXin LI 				mbc_pos = pos;
79889dd99dcSXin LI 				return (0);
79989dd99dcSXin LI 			} else
80089dd99dcSXin LI 				/* UTF8_INVALID or stray UTF8_TRAIL */
80189dd99dcSXin LI 				r = flush_mbc_buf(pos);
80289dd99dcSXin LI 		} else if (IS_UTF8_TRAIL(c))
80389dd99dcSXin LI 		{
80489dd99dcSXin LI 			mbc_buf[mbc_buf_index++] = c;
80589dd99dcSXin LI 			if (mbc_buf_index < mbc_buf_len)
80689dd99dcSXin LI 				return (0);
80789dd99dcSXin LI 			if (is_utf8_well_formed(mbc_buf))
80889dd99dcSXin LI 				r = do_append(get_wchar(mbc_buf), mbc_buf, mbc_pos);
80989dd99dcSXin LI 			else
81089dd99dcSXin LI 				/* Complete, but not shortest form, sequence. */
81189dd99dcSXin LI 				mbc_buf_index = r = flush_mbc_buf(mbc_pos);
81289dd99dcSXin LI 			mbc_buf_len = 0;
81389dd99dcSXin LI 		} else
81489dd99dcSXin LI 		{
81589dd99dcSXin LI 			/* Flush incomplete (truncated) sequence.  */
81689dd99dcSXin LI 			r = flush_mbc_buf(mbc_pos);
81789dd99dcSXin LI 			mbc_buf_index = r + 1;
81889dd99dcSXin LI 			mbc_buf_len = 0;
81989dd99dcSXin LI 			/* Handle new char.  */
82089dd99dcSXin LI 			if (!r)
82189dd99dcSXin LI 				goto retry;
82289dd99dcSXin LI  		}
82389dd99dcSXin LI 	}
82489dd99dcSXin LI 
825a5f0fb15SPaul Saab 	/*
826a5f0fb15SPaul Saab 	 * If we need to shift the line, do it.
827a5f0fb15SPaul Saab 	 * But wait until we get to at least the middle of the screen,
828a5f0fb15SPaul Saab 	 * so shifting it doesn't affect the chars we're currently
829a5f0fb15SPaul Saab 	 * pappending.  (Bold & underline can get messed up otherwise.)
830a5f0fb15SPaul Saab 	 */
831a5f0fb15SPaul Saab 	if (cshift < hshift && column > sc_width / 2)
832c9346414SPaul Saab 	{
833c9346414SPaul Saab 		linebuf[curr] = '\0';
834a5f0fb15SPaul Saab 		pshift(hshift - cshift);
835c9346414SPaul Saab 	}
83689dd99dcSXin LI 	if (r)
83789dd99dcSXin LI 	{
83889dd99dcSXin LI 		/* How many chars should caller back up? */
83989dd99dcSXin LI 		r = (!utf_mode) ? 1 : mbc_buf_index;
84089dd99dcSXin LI 	}
841a5f0fb15SPaul Saab 	return (r);
842a5f0fb15SPaul Saab }
843a5f0fb15SPaul Saab 
844a5f0fb15SPaul Saab 	static int
84589dd99dcSXin LI do_append(ch, rep, pos)
84689dd99dcSXin LI 	LWCHAR ch;
84789dd99dcSXin LI 	char *rep;
848a5f0fb15SPaul Saab 	POSITION pos;
849a5f0fb15SPaul Saab {
850a5f0fb15SPaul Saab 	register int a;
85189dd99dcSXin LI 	LWCHAR prev_ch;
852a5f0fb15SPaul Saab 
85389dd99dcSXin LI 	a = AT_NORMAL;
854a5f0fb15SPaul Saab 
85589dd99dcSXin LI 	if (ch == '\b')
856a5f0fb15SPaul Saab 	{
85789dd99dcSXin LI 		if (bs_mode == BS_CONTROL)
858a5f0fb15SPaul Saab 			goto do_control_char;
85989dd99dcSXin LI 
86089dd99dcSXin LI 		/*
86189dd99dcSXin LI 		 * A better test is needed here so we don't
86289dd99dcSXin LI 		 * backspace over part of the printed
86389dd99dcSXin LI 		 * representation of a binary character.
86489dd99dcSXin LI 		 */
86589dd99dcSXin LI 		if (   curr <= lmargin
86689dd99dcSXin LI 		    || column <= lmargin
86789dd99dcSXin LI 		    || (attr[curr - 1] & (AT_ANSI|AT_BINARY)))
86889dd99dcSXin LI 			STORE_PRCHAR('\b', pos);
86989dd99dcSXin LI 		else if (bs_mode == BS_NORMAL)
87089dd99dcSXin LI 			STORE_CHAR(ch, AT_NORMAL, NULL, pos);
87189dd99dcSXin LI 		else if (bs_mode == BS_SPECIAL)
87289dd99dcSXin LI 			overstrike = backc();
87389dd99dcSXin LI 
87489dd99dcSXin LI 		return 0;
875a5f0fb15SPaul Saab 	}
87689dd99dcSXin LI 
87789dd99dcSXin LI 	if (overstrike > 0)
878a5f0fb15SPaul Saab 	{
879a5f0fb15SPaul Saab 		/*
880a5f0fb15SPaul Saab 		 * Overstrike the character at the current position
881a5f0fb15SPaul Saab 		 * in the line buffer.  This will cause either
882a5f0fb15SPaul Saab 		 * underline (if a "_" is overstruck),
883a5f0fb15SPaul Saab 		 * bold (if an identical character is overstruck),
884a5f0fb15SPaul Saab 		 * or just deletion of the character in the buffer.
885a5f0fb15SPaul Saab 		 */
88689dd99dcSXin LI 		overstrike = utf_mode ? -1 : 0;
88789dd99dcSXin LI 		/* To be correct, this must be a base character.  */
88889dd99dcSXin LI 		prev_ch = get_wchar(linebuf + curr);
88989dd99dcSXin LI 		a = attr[curr];
89089dd99dcSXin LI 		if (ch == prev_ch)
891c9346414SPaul Saab 		{
892000ba3e8STim J. Robbins 			/*
893000ba3e8STim J. Robbins 			 * Overstriking a char with itself means make it bold.
894000ba3e8STim J. Robbins 			 * But overstriking an underscore with itself is
895000ba3e8STim J. Robbins 			 * ambiguous.  It could mean make it bold, or
896000ba3e8STim J. Robbins 			 * it could mean make it underlined.
897000ba3e8STim J. Robbins 			 * Use the previous overstrike to resolve it.
898000ba3e8STim J. Robbins 			 */
89989dd99dcSXin LI 			if (ch == '_')
90089dd99dcSXin LI 			{
90189dd99dcSXin LI 				if ((a & (AT_BOLD|AT_UNDERLINE)) != AT_NORMAL)
90289dd99dcSXin LI 					a |= (AT_BOLD|AT_UNDERLINE);
90389dd99dcSXin LI 				else if (last_overstrike != AT_NORMAL)
90489dd99dcSXin LI 					a |= last_overstrike;
905000ba3e8STim J. Robbins 				else
90689dd99dcSXin LI 					a |= AT_BOLD;
90789dd99dcSXin LI 			} else
90889dd99dcSXin LI 				a |= AT_BOLD;
90989dd99dcSXin LI 		} else if (ch == '_')
910c9346414SPaul Saab 		{
91189dd99dcSXin LI 			a |= AT_UNDERLINE;
91289dd99dcSXin LI 			ch = prev_ch;
91389dd99dcSXin LI 			rep = linebuf + curr;
91489dd99dcSXin LI 		} else if (prev_ch == '_')
915c9346414SPaul Saab 		{
91689dd99dcSXin LI 			a |= AT_UNDERLINE;
917000ba3e8STim J. Robbins 		}
91889dd99dcSXin LI 		/* Else we replace prev_ch, but we keep its attributes.  */
91989dd99dcSXin LI 	} else if (overstrike < 0)
920c9346414SPaul Saab 	{
92189dd99dcSXin LI 		if (   is_composing_char(ch)
92289dd99dcSXin LI 		    || is_combining_char(get_wchar(linebuf + curr), ch))
92389dd99dcSXin LI 			/* Continuation of the same overstrike.  */
92489dd99dcSXin LI 			a = last_overstrike;
925a5f0fb15SPaul Saab 		else
92689dd99dcSXin LI 			overstrike = 0;
92789dd99dcSXin LI 	}
92889dd99dcSXin LI 
92989dd99dcSXin LI 	if (ch == '\t')
930a5f0fb15SPaul Saab 	{
931a5f0fb15SPaul Saab 		/*
932a5f0fb15SPaul Saab 		 * Expand a tab into spaces.
933a5f0fb15SPaul Saab 		 */
934a5f0fb15SPaul Saab 		switch (bs_mode)
935a5f0fb15SPaul Saab 		{
936a5f0fb15SPaul Saab 		case BS_CONTROL:
937a5f0fb15SPaul Saab 			goto do_control_char;
938a5f0fb15SPaul Saab 		case BS_NORMAL:
939a5f0fb15SPaul Saab 		case BS_SPECIAL:
94089dd99dcSXin LI 			STORE_TAB(a, pos);
941a5f0fb15SPaul Saab 			break;
942a5f0fb15SPaul Saab 		}
94389dd99dcSXin LI 	} else if ((!utf_mode || is_ascii_char(ch)) && control_char((char)ch))
944a5f0fb15SPaul Saab 	{
945a5f0fb15SPaul Saab 	do_control_char:
94689dd99dcSXin LI 		if (ctldisp == OPT_ON || (ctldisp == OPT_ONPLUS && ch == ESC))
947a5f0fb15SPaul Saab 		{
948a5f0fb15SPaul Saab 			/*
949a5f0fb15SPaul Saab 			 * Output as a normal character.
950a5f0fb15SPaul Saab 			 */
95189dd99dcSXin LI 			STORE_CHAR(ch, AT_NORMAL, rep, pos);
952a5f0fb15SPaul Saab 		} else
953a5f0fb15SPaul Saab 		{
95489dd99dcSXin LI 			STORE_PRCHAR((char) ch, pos);
95589dd99dcSXin LI 		}
95689dd99dcSXin LI 	} else if (utf_mode && ctldisp != OPT_ON && is_ubin_char(ch))
95789dd99dcSXin LI 	{
95889dd99dcSXin LI 		char *s;
959a5f0fb15SPaul Saab 
96089dd99dcSXin LI 		s = prutfchar(ch);
96189dd99dcSXin LI 
96289dd99dcSXin LI 		if (column + (int) strlen(s) - 1 +
96389dd99dcSXin LI 		    pwidth(' ', binattr, 0) + attr_ewidth(binattr) > sc_width)
964a5f0fb15SPaul Saab 			return (1);
965a5f0fb15SPaul Saab 
966a5f0fb15SPaul Saab 		for ( ;  *s != 0;  s++)
96789dd99dcSXin LI 			STORE_CHAR(*s, AT_BINARY, NULL, pos);
968a5f0fb15SPaul Saab  	} else
969a5f0fb15SPaul Saab 	{
97089dd99dcSXin LI 		STORE_CHAR(ch, a, rep, pos);
97189dd99dcSXin LI 	}
97289dd99dcSXin LI  	return (0);
973a5f0fb15SPaul Saab }
974a5f0fb15SPaul Saab 
97589dd99dcSXin LI /*
97689dd99dcSXin LI  *
97789dd99dcSXin LI  */
97889dd99dcSXin LI 	public int
97989dd99dcSXin LI pflushmbc()
98089dd99dcSXin LI {
98189dd99dcSXin LI 	int r = 0;
98289dd99dcSXin LI 
98389dd99dcSXin LI 	if (mbc_buf_len > 0)
98489dd99dcSXin LI 	{
98589dd99dcSXin LI 		/* Flush incomplete (truncated) sequence.  */
98689dd99dcSXin LI 		r = flush_mbc_buf(mbc_pos);
98789dd99dcSXin LI 		mbc_buf_len = 0;
98889dd99dcSXin LI 	}
98989dd99dcSXin LI 	return r;
990a5f0fb15SPaul Saab }
991a5f0fb15SPaul Saab 
992a5f0fb15SPaul Saab /*
993a5f0fb15SPaul Saab  * Terminate the line in the line buffer.
994a5f0fb15SPaul Saab  */
995a5f0fb15SPaul Saab 	public void
996a5f0fb15SPaul Saab pdone(endline)
997a5f0fb15SPaul Saab 	int endline;
998a5f0fb15SPaul Saab {
999720c436cSXin LI 	int nl;
1000720c436cSXin LI 
100189dd99dcSXin LI 	(void) pflushmbc();
100289dd99dcSXin LI 
1003a5f0fb15SPaul Saab 	if (pendc && (pendc != '\r' || !endline))
1004a5f0fb15SPaul Saab 		/*
1005a5f0fb15SPaul Saab 		 * If we had a pending character, put it in the buffer.
1006a5f0fb15SPaul Saab 		 * But discard a pending CR if we are at end of line
1007a5f0fb15SPaul Saab 		 * (that is, discard the CR in a CR/LF sequence).
1008a5f0fb15SPaul Saab 		 */
100989dd99dcSXin LI 		(void) do_append(pendc, NULL, pendpos);
1010a5f0fb15SPaul Saab 
1011a5f0fb15SPaul Saab 	/*
1012a5f0fb15SPaul Saab 	 * Make sure we've shifted the line, if we need to.
1013a5f0fb15SPaul Saab 	 */
1014a5f0fb15SPaul Saab 	if (cshift < hshift)
1015a5f0fb15SPaul Saab 		pshift(hshift - cshift);
1016a5f0fb15SPaul Saab 
101789dd99dcSXin LI 	if (ctldisp == OPT_ONPLUS && is_ansi_end('m'))
101889dd99dcSXin LI 	{
101989dd99dcSXin LI 		/* Switch to normal attribute at end of line. */
102089dd99dcSXin LI 		char *p = "\033[m";
102189dd99dcSXin LI 		for ( ;  *p != '\0';  p++)
102289dd99dcSXin LI 		{
102389dd99dcSXin LI 			linebuf[curr] = *p;
102489dd99dcSXin LI 			attr[curr++] = AT_ANSI;
102589dd99dcSXin LI 		}
102689dd99dcSXin LI 	}
102789dd99dcSXin LI 
1028a5f0fb15SPaul Saab 	/*
1029a5f0fb15SPaul Saab 	 * Add a newline if necessary,
1030a5f0fb15SPaul Saab 	 * and append a '\0' to the end of the line.
1031720c436cSXin LI 	 * We output a newline if we're not at the right edge of the screen,
1032720c436cSXin LI 	 * or if the terminal doesn't auto wrap,
1033720c436cSXin LI 	 * or if this is really the end of the line AND the terminal ignores
1034720c436cSXin LI 	 * a newline at the right edge.
1035720c436cSXin LI 	 * (In the last case we don't want to output a newline if the terminal
1036720c436cSXin LI 	 * doesn't ignore it since that would produce an extra blank line.
1037720c436cSXin LI 	 * But we do want to output a newline if the terminal ignores it in case
1038720c436cSXin LI 	 * the next line is blank.  In that case the single newline output for
1039720c436cSXin LI 	 * that blank line would be ignored!)
1040a5f0fb15SPaul Saab 	 */
1041720c436cSXin LI 	if (!oldbot)
1042720c436cSXin LI 		nl = (column < sc_width || !auto_wrap || (endline && ignaw) || ctldisp == OPT_ON);
1043720c436cSXin LI 	else
1044720c436cSXin LI 		nl = (column < sc_width || !auto_wrap || ignaw || ctldisp == OPT_ON);
1045720c436cSXin LI 	if (nl)
1046a5f0fb15SPaul Saab 	{
1047a5f0fb15SPaul Saab 		linebuf[curr] = '\n';
1048a5f0fb15SPaul Saab 		attr[curr] = AT_NORMAL;
1049a5f0fb15SPaul Saab 		curr++;
1050a5f0fb15SPaul Saab 	}
1051a5f0fb15SPaul Saab 	linebuf[curr] = '\0';
1052a5f0fb15SPaul Saab 	attr[curr] = AT_NORMAL;
1053c9346414SPaul Saab 
1054c9346414SPaul Saab #if HILITE_SEARCH
105589dd99dcSXin LI 	if (status_col && line_matches > 0)
1056c9346414SPaul Saab 	{
1057c9346414SPaul Saab 		linebuf[0] = '*';
105889dd99dcSXin LI 		attr[0] = AT_NORMAL|AT_HILITE;
1059c9346414SPaul Saab 	}
1060c9346414SPaul Saab #endif
1061a5f0fb15SPaul Saab }
1062a5f0fb15SPaul Saab 
1063a5f0fb15SPaul Saab /*
1064a5f0fb15SPaul Saab  * Get a character from the current line.
1065a5f0fb15SPaul Saab  * Return the character as the function return value,
1066a5f0fb15SPaul Saab  * and the character attribute in *ap.
1067a5f0fb15SPaul Saab  */
1068a5f0fb15SPaul Saab 	public int
1069a5f0fb15SPaul Saab gline(i, ap)
1070a5f0fb15SPaul Saab 	register int i;
1071a5f0fb15SPaul Saab 	register int *ap;
1072a5f0fb15SPaul Saab {
1073a5f0fb15SPaul Saab 	if (is_null_line)
1074a5f0fb15SPaul Saab 	{
1075a5f0fb15SPaul Saab 		/*
1076a5f0fb15SPaul Saab 		 * If there is no current line, we pretend the line is
1077a5f0fb15SPaul Saab 		 * either "~" or "", depending on the "twiddle" flag.
1078a5f0fb15SPaul Saab 		 */
107989dd99dcSXin LI 		if (twiddle)
108089dd99dcSXin LI 		{
108189dd99dcSXin LI 			if (i == 0)
108289dd99dcSXin LI 			{
1083a5f0fb15SPaul Saab 				*ap = AT_BOLD;
108489dd99dcSXin LI 				return '~';
108589dd99dcSXin LI 			}
108689dd99dcSXin LI 			--i;
108789dd99dcSXin LI 		}
108889dd99dcSXin LI 		/* Make sure we're back to AT_NORMAL before the '\n'.  */
108989dd99dcSXin LI 		*ap = AT_NORMAL;
109089dd99dcSXin LI 		return i ? '\0' : '\n';
1091a5f0fb15SPaul Saab 	}
1092a5f0fb15SPaul Saab 
1093a5f0fb15SPaul Saab 	*ap = attr[i];
109489dd99dcSXin LI 	return (linebuf[i] & 0xFF);
1095a5f0fb15SPaul Saab }
1096a5f0fb15SPaul Saab 
1097a5f0fb15SPaul Saab /*
1098a5f0fb15SPaul Saab  * Indicate that there is no current line.
1099a5f0fb15SPaul Saab  */
1100a5f0fb15SPaul Saab 	public void
1101a5f0fb15SPaul Saab null_line()
1102a5f0fb15SPaul Saab {
1103a5f0fb15SPaul Saab 	is_null_line = 1;
1104a5f0fb15SPaul Saab 	cshift = 0;
1105a5f0fb15SPaul Saab }
1106a5f0fb15SPaul Saab 
1107a5f0fb15SPaul Saab /*
1108a5f0fb15SPaul Saab  * Analogous to forw_line(), but deals with "raw lines":
1109a5f0fb15SPaul Saab  * lines which are not split for screen width.
1110a5f0fb15SPaul Saab  * {{ This is supposed to be more efficient than forw_line(). }}
1111a5f0fb15SPaul Saab  */
1112a5f0fb15SPaul Saab 	public POSITION
1113720c436cSXin LI forw_raw_line(curr_pos, linep, line_lenp)
1114a5f0fb15SPaul Saab 	POSITION curr_pos;
1115a5f0fb15SPaul Saab 	char **linep;
1116720c436cSXin LI 	int *line_lenp;
1117a5f0fb15SPaul Saab {
1118c9346414SPaul Saab 	register int n;
1119a5f0fb15SPaul Saab 	register int c;
1120a5f0fb15SPaul Saab 	POSITION new_pos;
1121a5f0fb15SPaul Saab 
1122a5f0fb15SPaul Saab 	if (curr_pos == NULL_POSITION || ch_seek(curr_pos) ||
1123a5f0fb15SPaul Saab 		(c = ch_forw_get()) == EOI)
1124a5f0fb15SPaul Saab 		return (NULL_POSITION);
1125a5f0fb15SPaul Saab 
1126c9346414SPaul Saab 	n = 0;
1127a5f0fb15SPaul Saab 	for (;;)
1128a5f0fb15SPaul Saab 	{
112989dd99dcSXin LI 		if (c == '\n' || c == EOI || ABORT_SIGS())
1130a5f0fb15SPaul Saab 		{
1131a5f0fb15SPaul Saab 			new_pos = ch_tell();
1132a5f0fb15SPaul Saab 			break;
1133a5f0fb15SPaul Saab 		}
1134c9346414SPaul Saab 		if (n >= size_linebuf-1)
1135c9346414SPaul Saab 		{
1136c9346414SPaul Saab 			if (expand_linebuf())
1137a5f0fb15SPaul Saab 			{
1138a5f0fb15SPaul Saab 				/*
1139a5f0fb15SPaul Saab 				 * Overflowed the input buffer.
1140a5f0fb15SPaul Saab 				 * Pretend the line ended here.
1141a5f0fb15SPaul Saab 				 */
1142a5f0fb15SPaul Saab 				new_pos = ch_tell() - 1;
1143a5f0fb15SPaul Saab 				break;
1144a5f0fb15SPaul Saab 			}
1145c9346414SPaul Saab 		}
1146c9346414SPaul Saab 		linebuf[n++] = c;
1147a5f0fb15SPaul Saab 		c = ch_forw_get();
1148a5f0fb15SPaul Saab 	}
1149c9346414SPaul Saab 	linebuf[n] = '\0';
1150a5f0fb15SPaul Saab 	if (linep != NULL)
1151a5f0fb15SPaul Saab 		*linep = linebuf;
1152720c436cSXin LI 	if (line_lenp != NULL)
1153720c436cSXin LI 		*line_lenp = n;
1154a5f0fb15SPaul Saab 	return (new_pos);
1155a5f0fb15SPaul Saab }
1156a5f0fb15SPaul Saab 
1157a5f0fb15SPaul Saab /*
1158a5f0fb15SPaul Saab  * Analogous to back_line(), but deals with "raw lines".
1159a5f0fb15SPaul Saab  * {{ This is supposed to be more efficient than back_line(). }}
1160a5f0fb15SPaul Saab  */
1161a5f0fb15SPaul Saab 	public POSITION
1162720c436cSXin LI back_raw_line(curr_pos, linep, line_lenp)
1163a5f0fb15SPaul Saab 	POSITION curr_pos;
1164a5f0fb15SPaul Saab 	char **linep;
1165720c436cSXin LI 	int *line_lenp;
1166a5f0fb15SPaul Saab {
1167c9346414SPaul Saab 	register int n;
1168a5f0fb15SPaul Saab 	register int c;
1169a5f0fb15SPaul Saab 	POSITION new_pos;
1170a5f0fb15SPaul Saab 
1171a5f0fb15SPaul Saab 	if (curr_pos == NULL_POSITION || curr_pos <= ch_zero() ||
1172a5f0fb15SPaul Saab 		ch_seek(curr_pos-1))
1173a5f0fb15SPaul Saab 		return (NULL_POSITION);
1174a5f0fb15SPaul Saab 
1175c9346414SPaul Saab 	n = size_linebuf;
1176c9346414SPaul Saab 	linebuf[--n] = '\0';
1177a5f0fb15SPaul Saab 	for (;;)
1178a5f0fb15SPaul Saab 	{
1179a5f0fb15SPaul Saab 		c = ch_back_get();
118089dd99dcSXin LI 		if (c == '\n' || ABORT_SIGS())
1181a5f0fb15SPaul Saab 		{
1182a5f0fb15SPaul Saab 			/*
1183a5f0fb15SPaul Saab 			 * This is the newline ending the previous line.
1184a5f0fb15SPaul Saab 			 * We have hit the beginning of the line.
1185a5f0fb15SPaul Saab 			 */
1186a5f0fb15SPaul Saab 			new_pos = ch_tell() + 1;
1187a5f0fb15SPaul Saab 			break;
1188a5f0fb15SPaul Saab 		}
1189a5f0fb15SPaul Saab 		if (c == EOI)
1190a5f0fb15SPaul Saab 		{
1191a5f0fb15SPaul Saab 			/*
1192a5f0fb15SPaul Saab 			 * We have hit the beginning of the file.
1193a5f0fb15SPaul Saab 			 * This must be the first line in the file.
1194a5f0fb15SPaul Saab 			 * This must, of course, be the beginning of the line.
1195a5f0fb15SPaul Saab 			 */
1196a5f0fb15SPaul Saab 			new_pos = ch_zero();
1197a5f0fb15SPaul Saab 			break;
1198a5f0fb15SPaul Saab 		}
1199c9346414SPaul Saab 		if (n <= 0)
1200c9346414SPaul Saab 		{
1201c9346414SPaul Saab 			int old_size_linebuf = size_linebuf;
1202c9346414SPaul Saab 			char *fm;
1203c9346414SPaul Saab 			char *to;
1204c9346414SPaul Saab 			if (expand_linebuf())
1205a5f0fb15SPaul Saab 			{
1206a5f0fb15SPaul Saab 				/*
1207a5f0fb15SPaul Saab 				 * Overflowed the input buffer.
1208a5f0fb15SPaul Saab 				 * Pretend the line ended here.
1209a5f0fb15SPaul Saab 				 */
1210a5f0fb15SPaul Saab 				new_pos = ch_tell() + 1;
1211a5f0fb15SPaul Saab 				break;
1212a5f0fb15SPaul Saab 			}
1213c9346414SPaul Saab 			/*
1214c9346414SPaul Saab 			 * Shift the data to the end of the new linebuf.
1215c9346414SPaul Saab 			 */
12161d5cfebaSTim J. Robbins 			for (fm = linebuf + old_size_linebuf - 1,
12171d5cfebaSTim J. Robbins 			      to = linebuf + size_linebuf - 1;
1218c9346414SPaul Saab 			     fm >= linebuf;  fm--, to--)
1219c9346414SPaul Saab 				*to = *fm;
1220c9346414SPaul Saab 			n = size_linebuf - old_size_linebuf;
1221c9346414SPaul Saab 		}
1222c9346414SPaul Saab 		linebuf[--n] = c;
1223a5f0fb15SPaul Saab 	}
1224a5f0fb15SPaul Saab 	if (linep != NULL)
1225c9346414SPaul Saab 		*linep = &linebuf[n];
1226720c436cSXin LI 	if (line_lenp != NULL)
1227720c436cSXin LI 		*line_lenp = size_linebuf - 1 - n;
1228a5f0fb15SPaul Saab 	return (new_pos);
1229a5f0fb15SPaul Saab }
1230