line.c revision 172471
1/* $FreeBSD: head/contrib/less/line.c 172471 2007-10-08 16:17:42Z delphij $ */
2/*
3 * Copyright (C) 1984-2007  Mark Nudelman
4 *
5 * You may distribute under the terms of either the GNU General Public
6 * License or the Less License, as specified in the README file.
7 *
8 * For more information about less, or for information on how to
9 * contact the author, see the README file.
10 */
11
12
13/*
14 * Routines to manipulate the "line buffer".
15 * The line buffer holds a line of output as it is being built
16 * in preparation for output to the screen.
17 */
18
19#include "less.h"
20#include "charset.h"
21
22static char *linebuf = NULL;	/* Buffer which holds the current output line */
23static char *attr = NULL;	/* Extension of linebuf to hold attributes */
24public int size_linebuf = 0;	/* Size of line buffer (and attr buffer) */
25
26static int cshift;		/* Current left-shift of output line buffer */
27public int hshift;		/* Desired left-shift of output line buffer */
28public int tabstops[TABSTOP_MAX] = { 0 }; /* Custom tabstops */
29public int ntabstops = 1;	/* Number of tabstops */
30public int tabdefault = 8;	/* Default repeated tabstops */
31
32static int curr;		/* Index into linebuf */
33static int column;		/* Printable length, accounting for
34				   backspaces, etc. */
35static int overstrike;		/* Next char should overstrike previous char */
36static int last_overstrike = AT_NORMAL;
37static int is_null_line;	/* There is no current line */
38static int lmargin;		/* Left margin */
39static int line_matches;	/* Number of search matches in this line */
40static char pendc;
41static POSITION pendpos;
42static char *end_ansi_chars;
43static char *mid_ansi_chars;
44
45static int attr_swidth();
46static int attr_ewidth();
47static int do_append();
48
49extern int sigs;
50extern int bs_mode;
51extern int linenums;
52extern int ctldisp;
53extern int twiddle;
54extern int binattr;
55extern int status_col;
56extern int auto_wrap, ignaw;
57extern int bo_s_width, bo_e_width;
58extern int ul_s_width, ul_e_width;
59extern int bl_s_width, bl_e_width;
60extern int so_s_width, so_e_width;
61extern int sc_width, sc_height;
62extern int utf_mode;
63extern int oldbot;
64extern POSITION start_attnpos;
65extern POSITION end_attnpos;
66
67static char mbc_buf[MAX_UTF_CHAR_LEN];
68static int mbc_buf_len = 0;
69static int mbc_buf_index = 0;
70static POSITION mbc_pos;
71
72/*
73 * Initialize from environment variables.
74 */
75	public void
76init_line()
77{
78	end_ansi_chars = lgetenv("LESSANSIENDCHARS");
79	if (end_ansi_chars == NULL || *end_ansi_chars == '\0')
80		end_ansi_chars = "m";
81
82	mid_ansi_chars = lgetenv("LESSANSIMIDCHARS");
83	if (mid_ansi_chars == NULL || *mid_ansi_chars == '\0')
84		mid_ansi_chars = "0123456789;[?!\"'#%()*+ ";
85
86	linebuf = (char *) ecalloc(LINEBUF_SIZE, sizeof(char));
87	attr = (char *) ecalloc(LINEBUF_SIZE, sizeof(char));
88	size_linebuf = LINEBUF_SIZE;
89}
90
91/*
92 * Expand the line buffer.
93 */
94	static int
95expand_linebuf()
96{
97	/* Double the size of the line buffer. */
98	int new_size = size_linebuf * 2;
99
100	/* Just realloc to expand the buffer, if we can. */
101#if HAVE_REALLOC
102	char *new_buf = (char *) realloc(linebuf, new_size);
103	char *new_attr = (char *) realloc(attr, new_size);
104#else
105	char *new_buf = (char *) calloc(new_size, sizeof(char));
106	char *new_attr = (char *) calloc(new_size, sizeof(char));
107#endif
108	if (new_buf == NULL || new_attr == NULL)
109	{
110		if (new_attr != NULL)
111			free(new_attr);
112		if (new_buf != NULL)
113			free(new_buf);
114		return 1;
115	}
116#if HAVE_REALLOC
117	/*
118	 * We realloc'd the buffers; they already have the old contents.
119	 */
120	#if 0
121	memset(new_buf + size_linebuf, 0, new_size - size_linebuf);
122	memset(new_attr + size_linebuf, 0, new_size - size_linebuf);
123	#endif
124#else
125	/*
126	 * We just calloc'd the buffers; copy the old contents.
127	 */
128	memcpy(new_buf, linebuf, size_linebuf * sizeof(char));
129	memcpy(new_attr, attr, size_linebuf * sizeof(char));
130	free(attr);
131	free(linebuf);
132#endif
133	linebuf = new_buf;
134	attr = new_attr;
135	size_linebuf = new_size;
136	return 0;
137}
138
139/*
140 * Is a character ASCII?
141 */
142	public int
143is_ascii_char(ch)
144	LWCHAR ch;
145{
146	return (ch <= 0x7F);
147}
148
149/*
150 * Rewind the line buffer.
151 */
152	public void
153prewind()
154{
155	curr = 0;
156	column = 0;
157	cshift = 0;
158	overstrike = 0;
159	last_overstrike = AT_NORMAL;
160	mbc_buf_len = 0;
161	is_null_line = 0;
162	pendc = '\0';
163	lmargin = 0;
164	if (status_col)
165		lmargin += 1;
166#if HILITE_SEARCH
167	line_matches = 0;
168#endif
169}
170
171/*
172 * Insert the line number (of the given position) into the line buffer.
173 */
174	public void
175plinenum(pos)
176	POSITION pos;
177{
178	register LINENUM linenum = 0;
179	register int i;
180
181	if (linenums == OPT_ONPLUS)
182	{
183		/*
184		 * Get the line number and put it in the current line.
185		 * {{ Note: since find_linenum calls forw_raw_line,
186		 *    it may seek in the input file, requiring the caller
187		 *    of plinenum to re-seek if necessary. }}
188		 * {{ Since forw_raw_line modifies linebuf, we must
189		 *    do this first, before storing anything in linebuf. }}
190		 */
191		linenum = find_linenum(pos);
192	}
193
194	/*
195	 * Display a status column if the -J option is set.
196	 */
197	if (status_col)
198	{
199		linebuf[curr] = ' ';
200		if (start_attnpos != NULL_POSITION &&
201		    pos >= start_attnpos && pos < end_attnpos)
202			attr[curr] = AT_NORMAL|AT_HILITE;
203		else
204			attr[curr] = AT_NORMAL;
205		curr++;
206		column++;
207	}
208	/*
209	 * Display the line number at the start of each line
210	 * if the -N option is set.
211	 */
212	if (linenums == OPT_ONPLUS)
213	{
214		char buf[INT_STRLEN_BOUND(pos) + 2];
215		int n;
216
217		linenumtoa(linenum, buf);
218		n = strlen(buf);
219		if (n < MIN_LINENUM_WIDTH)
220			n = MIN_LINENUM_WIDTH;
221		sprintf(linebuf+curr, "%*s ", n, buf);
222		n++;  /* One space after the line number. */
223		for (i = 0; i < n; i++)
224			attr[curr+i] = AT_NORMAL;
225		curr += n;
226		column += n;
227		lmargin += n;
228	}
229
230	/*
231	 * Append enough spaces to bring us to the lmargin.
232	 */
233	while (column < lmargin)
234	{
235		linebuf[curr] = ' ';
236		attr[curr++] = AT_NORMAL;
237		column++;
238	}
239}
240
241/*
242 * Shift the input line left.
243 * This means discarding N printable chars at the start of the buffer.
244 */
245	static void
246pshift(shift)
247	int shift;
248{
249	LWCHAR prev_ch = 0;
250	unsigned char c;
251	int shifted = 0;
252	int to;
253	int from;
254	int len;
255	int width;
256	int prev_attr;
257	int next_attr;
258
259	if (shift > column - lmargin)
260		shift = column - lmargin;
261	if (shift > curr - lmargin)
262		shift = curr - lmargin;
263
264	to = from = lmargin;
265	/*
266	 * We keep on going when shifted == shift
267	 * to get all combining chars.
268	 */
269	while (shifted <= shift && from < curr)
270	{
271		c = linebuf[from];
272		if (ctldisp == OPT_ONPLUS && IS_CSI_START(c))
273		{
274			/* Keep cumulative effect.  */
275			linebuf[to] = c;
276			attr[to++] = attr[from++];
277			while (from < curr && linebuf[from])
278			{
279				linebuf[to] = linebuf[from];
280				attr[to++] = attr[from];
281				if (!is_ansi_middle(linebuf[from++]))
282					break;
283			}
284			continue;
285		}
286
287		width = 0;
288
289		if (!IS_ASCII_OCTET(c) && utf_mode)
290		{
291			/* Assumes well-formedness validation already done.  */
292			LWCHAR ch;
293
294			len = utf_len(c);
295			if (from + len > curr)
296				break;
297			ch = get_wchar(linebuf + from);
298			if (!is_composing_char(ch) && !is_combining_char(prev_ch, ch))
299				width = is_wide_char(ch) ? 2 : 1;
300			prev_ch = ch;
301		} else
302		{
303			len = 1;
304			if (c == '\b')
305				/* XXX - Incorrect if several '\b' in a row.  */
306				width = (utf_mode && is_wide_char(prev_ch)) ? -2 : -1;
307			else if (!control_char(c))
308				width = 1;
309			prev_ch = 0;
310		}
311
312		if (width == 2 && shift - shifted == 1) {
313			/* Should never happen when called by pshift_all().  */
314			attr[to] = attr[from];
315			/*
316			 * Assume a wide_char will never be the first half of a
317			 * combining_char pair, so reset prev_ch in case we're
318			 * followed by a '\b'.
319			 */
320			prev_ch = linebuf[to++] = ' ';
321			from += len;
322			shifted++;
323			continue;
324		}
325
326		/* Adjust width for magic cookies. */
327		prev_attr = (to > 0) ? attr[to-1] : AT_NORMAL;
328		next_attr = (from + len < curr) ? attr[from + len] : prev_attr;
329		if (!is_at_equiv(attr[from], prev_attr) &&
330			!is_at_equiv(attr[from], next_attr))
331		{
332			width += attr_swidth(attr[from]);
333			if (from + len < curr)
334				width += attr_ewidth(attr[from]);
335			if (is_at_equiv(prev_attr, next_attr))
336			{
337				width += attr_ewidth(prev_attr);
338				if (from + len < curr)
339					width += attr_swidth(next_attr);
340			}
341		}
342
343		if (shift - shifted < width)
344			break;
345		from += len;
346		shifted += width;
347		if (shifted < 0)
348			shifted = 0;
349	}
350	while (from < curr)
351	{
352		linebuf[to] = linebuf[from];
353		attr[to++] = attr[from++];
354	}
355	curr = to;
356	column -= shifted;
357	cshift += shifted;
358}
359
360/*
361 *
362 */
363	public void
364pshift_all()
365{
366	pshift(column);
367}
368
369/*
370 * Return the printing width of the start (enter) sequence
371 * for a given character attribute.
372 */
373	static int
374attr_swidth(a)
375	int a;
376{
377	int w = 0;
378
379	a = apply_at_specials(a);
380
381	if (a & AT_UNDERLINE)
382		w += ul_s_width;
383	if (a & AT_BOLD)
384		w += bo_s_width;
385	if (a & AT_BLINK)
386		w += bl_s_width;
387	if (a & AT_STANDOUT)
388		w += so_s_width;
389
390	return w;
391}
392
393/*
394 * Return the printing width of the end (exit) sequence
395 * for a given character attribute.
396 */
397	static int
398attr_ewidth(a)
399	int a;
400{
401	int w = 0;
402
403	a = apply_at_specials(a);
404
405	if (a & AT_UNDERLINE)
406		w += ul_e_width;
407	if (a & AT_BOLD)
408		w += bo_e_width;
409	if (a & AT_BLINK)
410		w += bl_e_width;
411	if (a & AT_STANDOUT)
412		w += so_e_width;
413
414	return w;
415}
416
417/*
418 * Return the printing width of a given character and attribute,
419 * if the character were added to the current position in the line buffer.
420 * Adding a character with a given attribute may cause an enter or exit
421 * attribute sequence to be inserted, so this must be taken into account.
422 */
423	static int
424pwidth(ch, a, prev_ch)
425	LWCHAR ch;
426	int a;
427	LWCHAR prev_ch;
428{
429	int w;
430
431	if (ch == '\b')
432		/*
433		 * Backspace moves backwards one or two positions.
434		 * XXX - Incorrect if several '\b' in a row.
435		 */
436		return (utf_mode && is_wide_char(prev_ch)) ? -2 : -1;
437
438	if (!utf_mode || is_ascii_char(ch))
439	{
440		if (control_char((char)ch))
441		{
442			/*
443			 * Control characters do unpredictable things,
444			 * so we don't even try to guess; say it doesn't move.
445			 * This can only happen if the -r flag is in effect.
446			 */
447			return (0);
448		}
449	} else
450	{
451		if (is_composing_char(ch) || is_combining_char(prev_ch, ch))
452		{
453			/*
454			 * Composing and combining chars take up no space.
455			 *
456			 * Some terminals, upon failure to compose a
457			 * composing character with the character(s) that
458			 * precede(s) it will actually take up one column
459			 * for the composing character; there isn't much
460			 * we could do short of testing the (complex)
461			 * composition process ourselves and printing
462			 * a binary representation when it fails.
463			 */
464			return (0);
465		}
466	}
467
468	/*
469	 * Other characters take one or two columns,
470	 * plus the width of any attribute enter/exit sequence.
471	 */
472	w = 1;
473	if (is_wide_char(ch))
474		w++;
475	if (curr > 0 && !is_at_equiv(attr[curr-1], a))
476		w += attr_ewidth(attr[curr-1]);
477	if ((apply_at_specials(a) != AT_NORMAL) &&
478	    (curr == 0 || !is_at_equiv(attr[curr-1], a)))
479		w += attr_swidth(a);
480	return (w);
481}
482
483/*
484 * Delete to the previous base character in the line buffer.
485 * Return 1 if one is found.
486 */
487	static int
488backc()
489{
490	LWCHAR prev_ch;
491	char *p = linebuf + curr;
492	LWCHAR ch = step_char(&p, -1, linebuf + lmargin);
493	int width;
494
495	/* This assumes that there is no '\b' in linebuf.  */
496	while (   curr > lmargin
497	       && column > lmargin
498	       && (!(attr[curr - 1] & (AT_ANSI|AT_BINARY))))
499	{
500		curr = p - linebuf;
501		prev_ch = step_char(&p, -1, linebuf + lmargin);
502		width = pwidth(ch, attr[curr], prev_ch);
503		column -= width;
504		if (width > 0)
505			return 1;
506		ch = prev_ch;
507	}
508
509	return 0;
510}
511
512/*
513 * Are we currently within a recognized ANSI escape sequence?
514 */
515	static int
516in_ansi_esc_seq()
517{
518	char *p;
519
520	/*
521	 * Search backwards for either an ESC (which means we ARE in a seq);
522	 * or an end char (which means we're NOT in a seq).
523	 */
524	for (p = &linebuf[curr];  p > linebuf; )
525	{
526		LWCHAR ch = step_char(&p, -1, linebuf);
527		if (IS_CSI_START(ch))
528			return (1);
529		if (!is_ansi_middle(ch))
530			return (0);
531	}
532	return (0);
533}
534
535/*
536 * Is a character the end of an ANSI escape sequence?
537 */
538	public int
539is_ansi_end(ch)
540	LWCHAR ch;
541{
542	if (!is_ascii_char(ch))
543		return (0);
544	return (strchr(end_ansi_chars, (char) ch) != NULL);
545}
546
547/*
548 *
549 */
550	public int
551is_ansi_middle(ch)
552	LWCHAR ch;
553{
554	if (!is_ascii_char(ch))
555		return (0);
556	if (is_ansi_end(ch))
557		return (0);
558	return (strchr(mid_ansi_chars, (char) ch) != NULL);
559}
560
561/*
562 * Append a character and attribute to the line buffer.
563 */
564#define	STORE_CHAR(ch,a,rep,pos) \
565	do { \
566		if (store_char((ch),(a),(rep),(pos))) return (1); \
567	} while (0)
568
569	static int
570store_char(ch, a, rep, pos)
571	LWCHAR ch;
572	int a;
573	char *rep;
574	POSITION pos;
575{
576	int w;
577	int replen;
578	char cs;
579
580	w = (a & (AT_UNDERLINE|AT_BOLD));	/* Pre-use w.  */
581	if (w != AT_NORMAL)
582		last_overstrike = w;
583
584#if HILITE_SEARCH
585	{
586		int matches;
587		if (is_hilited(pos, pos+1, 0, &matches))
588		{
589			/*
590			 * This character should be highlighted.
591			 * Override the attribute passed in.
592			 */
593			if (a != AT_ANSI)
594				a |= AT_HILITE;
595		}
596		line_matches += matches;
597	}
598#endif
599
600	if (ctldisp == OPT_ONPLUS && in_ansi_esc_seq())
601	{
602		if (!is_ansi_end(ch) && !is_ansi_middle(ch)) {
603			/* Remove whole unrecognized sequence.  */
604			do {
605				--curr;
606			} while (!IS_CSI_START(linebuf[curr]));
607			return 0;
608		}
609		a = AT_ANSI;	/* Will force re-AT_'ing around it.  */
610		w = 0;
611	}
612	else if (ctldisp == OPT_ONPLUS && IS_CSI_START(ch))
613	{
614		a = AT_ANSI;	/* Will force re-AT_'ing around it.  */
615		w = 0;
616	}
617	else
618	{
619		char *p = &linebuf[curr];
620		LWCHAR prev_ch = step_char(&p, -1, linebuf);
621		w = pwidth(ch, a, prev_ch);
622	}
623
624	if (ctldisp != OPT_ON && column + w + attr_ewidth(a) > sc_width)
625		/*
626		 * Won't fit on screen.
627		 */
628		return (1);
629
630	if (rep == NULL)
631	{
632		cs = (char) ch;
633		rep = &cs;
634		replen = 1;
635	} else
636	{
637		replen = utf_len(rep[0]);
638	}
639	if (curr + replen >= size_linebuf-6)
640	{
641		/*
642		 * Won't fit in line buffer.
643		 * Try to expand it.
644		 */
645		if (expand_linebuf())
646			return (1);
647	}
648
649	while (replen-- > 0)
650	{
651		linebuf[curr] = *rep++;
652		attr[curr] = a;
653		curr++;
654	}
655	column += w;
656	return (0);
657}
658
659/*
660 * Append a tab to the line buffer.
661 * Store spaces to represent the tab.
662 */
663#define	STORE_TAB(a,pos) \
664	do { if (store_tab((a),(pos))) return (1); } while (0)
665
666	static int
667store_tab(attr, pos)
668	int attr;
669	POSITION pos;
670{
671	int to_tab = column + cshift - lmargin;
672	int i;
673
674	if (ntabstops < 2 || to_tab >= tabstops[ntabstops-1])
675		to_tab = tabdefault -
676		     ((to_tab - tabstops[ntabstops-1]) % tabdefault);
677	else
678	{
679		for (i = ntabstops - 2;  i >= 0;  i--)
680			if (to_tab >= tabstops[i])
681				break;
682		to_tab = tabstops[i+1] - to_tab;
683	}
684
685	if (column + to_tab - 1 + pwidth(' ', attr, 0) + attr_ewidth(attr) > sc_width)
686		return 1;
687
688	do {
689		STORE_CHAR(' ', attr, " ", pos);
690	} while (--to_tab > 0);
691	return 0;
692}
693
694#define STORE_PRCHAR(c, pos) \
695	do { if (store_prchar((c), (pos))) return 1; } while (0)
696
697	static int
698store_prchar(c, pos)
699	char c;
700	POSITION pos;
701{
702	char *s;
703
704	/*
705	 * Convert to printable representation.
706	 */
707	s = prchar(c);
708
709	/*
710	 * Make sure we can get the entire representation
711	 * of the character on this line.
712	 */
713	if (column + (int) strlen(s) - 1 +
714            pwidth(' ', binattr, 0) + attr_ewidth(binattr) > sc_width)
715		return 1;
716
717	for ( ;  *s != 0;  s++)
718		STORE_CHAR(*s, AT_BINARY, NULL, pos);
719
720	return 0;
721}
722
723	static int
724flush_mbc_buf(pos)
725	POSITION pos;
726{
727	int i;
728
729	for (i = 0; i < mbc_buf_index; i++)
730		if (store_prchar(mbc_buf[i], pos))
731			return mbc_buf_index - i;
732
733	return 0;
734}
735
736/*
737 * Append a character to the line buffer.
738 * Expand tabs into spaces, handle underlining, boldfacing, etc.
739 * Returns 0 if ok, 1 if couldn't fit in buffer.
740 */
741	public int
742pappend(c, pos)
743	char c;
744	POSITION pos;
745{
746	int r;
747
748	if (pendc)
749	{
750		if (do_append(pendc, NULL, pendpos))
751			/*
752			 * Oops.  We've probably lost the char which
753			 * was in pendc, since caller won't back up.
754			 */
755			return (1);
756		pendc = '\0';
757	}
758
759	if (c == '\r' && bs_mode == BS_SPECIAL)
760	{
761		if (mbc_buf_len > 0)  /* utf_mode must be on. */
762		{
763			/* Flush incomplete (truncated) sequence. */
764			r = flush_mbc_buf(mbc_pos);
765			mbc_buf_index = r + 1;
766			mbc_buf_len = 0;
767			if (r)
768				return (mbc_buf_index);
769		}
770
771		/*
772		 * Don't put the CR into the buffer until we see
773		 * the next char.  If the next char is a newline,
774		 * discard the CR.
775		 */
776		pendc = c;
777		pendpos = pos;
778		return (0);
779	}
780
781	if (!utf_mode)
782	{
783		r = do_append((LWCHAR) c, NULL, pos);
784	} else
785	{
786		/* Perform strict validation in all possible cases. */
787		if (mbc_buf_len == 0)
788		{
789		retry:
790			mbc_buf_index = 1;
791			*mbc_buf = c;
792			if (IS_ASCII_OCTET(c))
793				r = do_append((LWCHAR) c, NULL, pos);
794			else if (IS_UTF8_LEAD(c))
795			{
796				mbc_buf_len = utf_len(c);
797				mbc_pos = pos;
798				return (0);
799			} else
800				/* UTF8_INVALID or stray UTF8_TRAIL */
801				r = flush_mbc_buf(pos);
802		} else if (IS_UTF8_TRAIL(c))
803		{
804			mbc_buf[mbc_buf_index++] = c;
805			if (mbc_buf_index < mbc_buf_len)
806				return (0);
807			if (is_utf8_well_formed(mbc_buf))
808				r = do_append(get_wchar(mbc_buf), mbc_buf, mbc_pos);
809			else
810				/* Complete, but not shortest form, sequence. */
811				mbc_buf_index = r = flush_mbc_buf(mbc_pos);
812			mbc_buf_len = 0;
813		} else
814		{
815			/* Flush incomplete (truncated) sequence.  */
816			r = flush_mbc_buf(mbc_pos);
817			mbc_buf_index = r + 1;
818			mbc_buf_len = 0;
819			/* Handle new char.  */
820			if (!r)
821				goto retry;
822 		}
823	}
824
825	/*
826	 * If we need to shift the line, do it.
827	 * But wait until we get to at least the middle of the screen,
828	 * so shifting it doesn't affect the chars we're currently
829	 * pappending.  (Bold & underline can get messed up otherwise.)
830	 */
831	if (cshift < hshift && column > sc_width / 2)
832	{
833		linebuf[curr] = '\0';
834		pshift(hshift - cshift);
835	}
836	if (r)
837	{
838		/* How many chars should caller back up? */
839		r = (!utf_mode) ? 1 : mbc_buf_index;
840	}
841	return (r);
842}
843
844	static int
845do_append(ch, rep, pos)
846	LWCHAR ch;
847	char *rep;
848	POSITION pos;
849{
850	register int a;
851	LWCHAR prev_ch;
852
853	a = AT_NORMAL;
854
855	if (ch == '\b')
856	{
857		if (bs_mode == BS_CONTROL)
858			goto do_control_char;
859
860		/*
861		 * A better test is needed here so we don't
862		 * backspace over part of the printed
863		 * representation of a binary character.
864		 */
865		if (   curr <= lmargin
866		    || column <= lmargin
867		    || (attr[curr - 1] & (AT_ANSI|AT_BINARY)))
868			STORE_PRCHAR('\b', pos);
869		else if (bs_mode == BS_NORMAL)
870			STORE_CHAR(ch, AT_NORMAL, NULL, pos);
871		else if (bs_mode == BS_SPECIAL)
872			overstrike = backc();
873
874		return 0;
875	}
876
877	if (overstrike > 0)
878	{
879		/*
880		 * Overstrike the character at the current position
881		 * in the line buffer.  This will cause either
882		 * underline (if a "_" is overstruck),
883		 * bold (if an identical character is overstruck),
884		 * or just deletion of the character in the buffer.
885		 */
886		overstrike = utf_mode ? -1 : 0;
887		/* To be correct, this must be a base character.  */
888		prev_ch = get_wchar(linebuf + curr);
889		a = attr[curr];
890		if (ch == prev_ch)
891		{
892			/*
893			 * Overstriking a char with itself means make it bold.
894			 * But overstriking an underscore with itself is
895			 * ambiguous.  It could mean make it bold, or
896			 * it could mean make it underlined.
897			 * Use the previous overstrike to resolve it.
898			 */
899			if (ch == '_')
900			{
901				if ((a & (AT_BOLD|AT_UNDERLINE)) != AT_NORMAL)
902					a |= (AT_BOLD|AT_UNDERLINE);
903				else if (last_overstrike != AT_NORMAL)
904					a |= last_overstrike;
905				else
906					a |= AT_BOLD;
907			} else
908				a |= AT_BOLD;
909		} else if (ch == '_')
910		{
911			a |= AT_UNDERLINE;
912			ch = prev_ch;
913			rep = linebuf + curr;
914		} else if (prev_ch == '_')
915		{
916			a |= AT_UNDERLINE;
917		}
918		/* Else we replace prev_ch, but we keep its attributes.  */
919	} else if (overstrike < 0)
920	{
921		if (   is_composing_char(ch)
922		    || is_combining_char(get_wchar(linebuf + curr), ch))
923			/* Continuation of the same overstrike.  */
924			a = last_overstrike;
925		else
926			overstrike = 0;
927	}
928
929	if (ch == '\t')
930	{
931		/*
932		 * Expand a tab into spaces.
933		 */
934		switch (bs_mode)
935		{
936		case BS_CONTROL:
937			goto do_control_char;
938		case BS_NORMAL:
939		case BS_SPECIAL:
940			STORE_TAB(a, pos);
941			break;
942		}
943	} else if ((!utf_mode || is_ascii_char(ch)) && control_char((char)ch))
944	{
945	do_control_char:
946		if (ctldisp == OPT_ON || (ctldisp == OPT_ONPLUS && IS_CSI_START(ch)))
947		{
948			/*
949			 * Output as a normal character.
950			 */
951			STORE_CHAR(ch, AT_NORMAL, rep, pos);
952		} else
953		{
954			STORE_PRCHAR((char) ch, pos);
955		}
956	} else if (utf_mode && ctldisp != OPT_ON && is_ubin_char(ch))
957	{
958		char *s;
959
960		s = prutfchar(ch);
961
962		if (column + (int) strlen(s) - 1 +
963		    pwidth(' ', binattr, 0) + attr_ewidth(binattr) > sc_width)
964			return (1);
965
966		for ( ;  *s != 0;  s++)
967			STORE_CHAR(*s, AT_BINARY, NULL, pos);
968 	} else
969	{
970		STORE_CHAR(ch, a, rep, pos);
971	}
972 	return (0);
973}
974
975/*
976 *
977 */
978	public int
979pflushmbc()
980{
981	int r = 0;
982
983	if (mbc_buf_len > 0)
984	{
985		/* Flush incomplete (truncated) sequence.  */
986		r = flush_mbc_buf(mbc_pos);
987		mbc_buf_len = 0;
988	}
989	return r;
990}
991
992/*
993 * Terminate the line in the line buffer.
994 */
995	public void
996pdone(endline)
997	int endline;
998{
999	int nl;
1000
1001	(void) pflushmbc();
1002
1003	if (pendc && (pendc != '\r' || !endline))
1004		/*
1005		 * If we had a pending character, put it in the buffer.
1006		 * But discard a pending CR if we are at end of line
1007		 * (that is, discard the CR in a CR/LF sequence).
1008		 */
1009		(void) do_append(pendc, NULL, pendpos);
1010
1011	/*
1012	 * Make sure we've shifted the line, if we need to.
1013	 */
1014	if (cshift < hshift)
1015		pshift(hshift - cshift);
1016
1017	if (ctldisp == OPT_ONPLUS && is_ansi_end('m'))
1018	{
1019		/* Switch to normal attribute at end of line. */
1020		char *p = "\033[m";
1021		for ( ;  *p != '\0';  p++)
1022		{
1023			linebuf[curr] = *p;
1024			attr[curr++] = AT_ANSI;
1025		}
1026	}
1027
1028	/*
1029	 * Add a newline if necessary,
1030	 * and append a '\0' to the end of the line.
1031	 * We output a newline if we're not at the right edge of the screen,
1032	 * or if the terminal doesn't auto wrap,
1033	 * or if this is really the end of the line AND the terminal ignores
1034	 * a newline at the right edge.
1035	 * (In the last case we don't want to output a newline if the terminal
1036	 * doesn't ignore it since that would produce an extra blank line.
1037	 * But we do want to output a newline if the terminal ignores it in case
1038	 * the next line is blank.  In that case the single newline output for
1039	 * that blank line would be ignored!)
1040	 */
1041	if (!oldbot)
1042		nl = (column < sc_width || !auto_wrap || (endline && ignaw) || ctldisp == OPT_ON);
1043	else
1044		nl = (column < sc_width || !auto_wrap || ignaw || ctldisp == OPT_ON);
1045	if (nl)
1046	{
1047		linebuf[curr] = '\n';
1048		attr[curr] = AT_NORMAL;
1049		curr++;
1050	}
1051	linebuf[curr] = '\0';
1052	attr[curr] = AT_NORMAL;
1053
1054#if HILITE_SEARCH
1055	if (status_col && line_matches > 0)
1056	{
1057		linebuf[0] = '*';
1058		attr[0] = AT_NORMAL|AT_HILITE;
1059	}
1060#endif
1061}
1062
1063/*
1064 * Get a character from the current line.
1065 * Return the character as the function return value,
1066 * and the character attribute in *ap.
1067 */
1068	public int
1069gline(i, ap)
1070	register int i;
1071	register int *ap;
1072{
1073	if (is_null_line)
1074	{
1075		/*
1076		 * If there is no current line, we pretend the line is
1077		 * either "~" or "", depending on the "twiddle" flag.
1078		 */
1079		if (twiddle)
1080		{
1081			if (i == 0)
1082			{
1083				*ap = AT_BOLD;
1084				return '~';
1085			}
1086			--i;
1087		}
1088		/* Make sure we're back to AT_NORMAL before the '\n'.  */
1089		*ap = AT_NORMAL;
1090		return i ? '\0' : '\n';
1091	}
1092
1093	*ap = attr[i];
1094	return (linebuf[i] & 0xFF);
1095}
1096
1097/*
1098 * Indicate that there is no current line.
1099 */
1100	public void
1101null_line()
1102{
1103	is_null_line = 1;
1104	cshift = 0;
1105}
1106
1107/*
1108 * Analogous to forw_line(), but deals with "raw lines":
1109 * lines which are not split for screen width.
1110 * {{ This is supposed to be more efficient than forw_line(). }}
1111 */
1112	public POSITION
1113forw_raw_line(curr_pos, linep, line_lenp)
1114	POSITION curr_pos;
1115	char **linep;
1116	int *line_lenp;
1117{
1118	register int n;
1119	register int c;
1120	POSITION new_pos;
1121
1122	if (curr_pos == NULL_POSITION || ch_seek(curr_pos) ||
1123		(c = ch_forw_get()) == EOI)
1124		return (NULL_POSITION);
1125
1126	n = 0;
1127	for (;;)
1128	{
1129		if (c == '\n' || c == EOI || ABORT_SIGS())
1130		{
1131			new_pos = ch_tell();
1132			break;
1133		}
1134		if (n >= size_linebuf-1)
1135		{
1136			if (expand_linebuf())
1137			{
1138				/*
1139				 * Overflowed the input buffer.
1140				 * Pretend the line ended here.
1141				 */
1142				new_pos = ch_tell() - 1;
1143				break;
1144			}
1145		}
1146		linebuf[n++] = c;
1147		c = ch_forw_get();
1148	}
1149	linebuf[n] = '\0';
1150	if (linep != NULL)
1151		*linep = linebuf;
1152	if (line_lenp != NULL)
1153		*line_lenp = n;
1154	return (new_pos);
1155}
1156
1157/*
1158 * Analogous to back_line(), but deals with "raw lines".
1159 * {{ This is supposed to be more efficient than back_line(). }}
1160 */
1161	public POSITION
1162back_raw_line(curr_pos, linep, line_lenp)
1163	POSITION curr_pos;
1164	char **linep;
1165	int *line_lenp;
1166{
1167	register int n;
1168	register int c;
1169	POSITION new_pos;
1170
1171	if (curr_pos == NULL_POSITION || curr_pos <= ch_zero() ||
1172		ch_seek(curr_pos-1))
1173		return (NULL_POSITION);
1174
1175	n = size_linebuf;
1176	linebuf[--n] = '\0';
1177	for (;;)
1178	{
1179		c = ch_back_get();
1180		if (c == '\n' || ABORT_SIGS())
1181		{
1182			/*
1183			 * This is the newline ending the previous line.
1184			 * We have hit the beginning of the line.
1185			 */
1186			new_pos = ch_tell() + 1;
1187			break;
1188		}
1189		if (c == EOI)
1190		{
1191			/*
1192			 * We have hit the beginning of the file.
1193			 * This must be the first line in the file.
1194			 * This must, of course, be the beginning of the line.
1195			 */
1196			new_pos = ch_zero();
1197			break;
1198		}
1199		if (n <= 0)
1200		{
1201			int old_size_linebuf = size_linebuf;
1202			char *fm;
1203			char *to;
1204			if (expand_linebuf())
1205			{
1206				/*
1207				 * Overflowed the input buffer.
1208				 * Pretend the line ended here.
1209				 */
1210				new_pos = ch_tell() + 1;
1211				break;
1212			}
1213			/*
1214			 * Shift the data to the end of the new linebuf.
1215			 */
1216			for (fm = linebuf + old_size_linebuf - 1,
1217			      to = linebuf + size_linebuf - 1;
1218			     fm >= linebuf;  fm--, to--)
1219				*to = *fm;
1220			n = size_linebuf - old_size_linebuf;
1221		}
1222		linebuf[--n] = c;
1223	}
1224	if (linep != NULL)
1225		*linep = &linebuf[n];
1226	if (line_lenp != NULL)
1227		*line_lenp = size_linebuf - 1 - n;
1228	return (new_pos);
1229}
1230