/* xref: /openbsd/usr.bin/mandoc/term_ascii.c (revision 84680f53) */
/* $OpenBSD: term_ascii.c,v 1.55 2023/11/13 19:13:00 schwarze Exp $ */
/*
 * Copyright (c) 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv>
 * Copyright (c) 2014,2015,2017,2018,2020 Ingo Schwarze <schwarze@openbsd.org>
 *
 * Permission to use, copy, modify, and distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHORS DISCLAIM ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 */
18f95d589eSschwarze #include <sys/types.h>
19f95d589eSschwarze 
206899db98Sschwarze #include <assert.h>
21414b1fadSschwarze #include <langinfo.h>
22a5e11edeSschwarze #include <locale.h>
23f95d589eSschwarze #include <stdint.h>
24f95d589eSschwarze #include <stdio.h>
25f95d589eSschwarze #include <stdlib.h>
26414b1fadSschwarze #include <string.h>
27f95d589eSschwarze #include <unistd.h>
28a5e11edeSschwarze #include <wchar.h>
29f95d589eSschwarze 
302791bd1cSschwarze #include "mandoc.h"
314f4f7972Sschwarze #include "mandoc_aux.h"
32f95d589eSschwarze #include "out.h"
33f95d589eSschwarze #include "term.h"
342ccd0917Sschwarze #include "manconf.h"
35f95d589eSschwarze #include "main.h"
36f95d589eSschwarze 
/* Locale passed to setlocale(3) when UTF-8 output is explicitly requested. */
#define UTF8_LOCALE	"en_US.UTF-8"

/* Common constructor behind ascii_alloc(), utf8_alloc(), locale_alloc(). */
static	struct termp	 *ascii_init(enum termenc enc,
				const struct manoutput *outopts);

/* Callbacks installed for every encoding. */
static	void		  ascii_begin(struct termp *p);
static	void		  ascii_end(struct termp *p);
static	int		  ascii_hspan(const struct termp *p,
				const struct roffsu *su);
static	void		  ascii_setwidth(struct termp *p, int iop, int width);

/* Output callbacks using the byte-oriented stdio functions. */
static	void		  ascii_advance(struct termp *p, size_t len);
static	void		  ascii_endline(struct termp *p);
static	void		  ascii_letter(struct termp *p, int c);
static	size_t		  ascii_width(const struct termp *p, int c);

/* Output callbacks using the wide-character stdio functions. */
static	void		  locale_advance(struct termp *p, size_t len);
static	void		  locale_endline(struct termp *p);
static	void		  locale_letter(struct termp *p, int c);
static	size_t		  locale_width(const struct termp *p, int c);
54f95d589eSschwarze 
5549aff9f8Sschwarze 
56a5e11edeSschwarze static struct termp *
ascii_init(enum termenc enc,const struct manoutput * outopts)5716536faaSschwarze ascii_init(enum termenc enc, const struct manoutput *outopts)
58f95d589eSschwarze {
59f95d589eSschwarze 	char		*v;
60a5e11edeSschwarze 	struct termp	*p;
61f95d589eSschwarze 
62e93ea447Sschwarze 	p = mandoc_calloc(1, sizeof(*p));
63e93ea447Sschwarze 	p->tcol = p->tcols = mandoc_calloc(1, sizeof(*p->tcol));
64e93ea447Sschwarze 	p->maxtcol = 1;
65f95d589eSschwarze 
66c0a657b3Sschwarze 	p->line = 1;
67*84680f53Sschwarze 	p->defindent = 5;
685281506aSschwarze 	p->defrmargin = p->lastrmargin = 78;
69c48a0735Sschwarze 	p->fontq = mandoc_reallocarray(NULL,
70e93ea447Sschwarze 	     (p->fontsz = 8), sizeof(*p->fontq));
71c48a0735Sschwarze 	p->fontq[0] = p->fontl = TERMFONT_NONE;
723ebeb861Sschwarze 
73f95d589eSschwarze 	p->begin = ascii_begin;
74f95d589eSschwarze 	p->end = ascii_end;
75769ee804Sschwarze 	p->hspan = ascii_hspan;
76769ee804Sschwarze 	p->type = TERMTYPE_CHAR;
77a5e11edeSschwarze 
78a5e11edeSschwarze 	p->enc = TERMENC_ASCII;
79a5e11edeSschwarze 	p->advance = ascii_advance;
80a5e11edeSschwarze 	p->endline = ascii_endline;
81a5e11edeSschwarze 	p->letter = ascii_letter;
825281506aSschwarze 	p->setwidth = ascii_setwidth;
833ebeb861Sschwarze 	p->width = ascii_width;
84f95d589eSschwarze 
8553d61c88Sschwarze 	if (enc != TERMENC_ASCII) {
868621bbcaSschwarze 
878621bbcaSschwarze 		/*
888621bbcaSschwarze 		 * Do not change any of this to LC_ALL.  It might break
898621bbcaSschwarze 		 * the formatting by subtly changing the behaviour of
908621bbcaSschwarze 		 * various functions, for example strftime(3).  As a
918621bbcaSschwarze 		 * worst case, it might even cause buffer overflows.
928621bbcaSschwarze 		 */
938621bbcaSschwarze 
9453d61c88Sschwarze 		v = enc == TERMENC_LOCALE ?
958621bbcaSschwarze 		    setlocale(LC_CTYPE, "") :
96ecf32ec4Sschwarze 		    setlocale(LC_CTYPE, UTF8_LOCALE);
97414b1fadSschwarze 
98414b1fadSschwarze 		/*
99414b1fadSschwarze 		 * We only support UTF-8,
100414b1fadSschwarze 		 * so revert to ASCII for anything else.
101414b1fadSschwarze 		 */
102414b1fadSschwarze 
103414b1fadSschwarze 		if (v != NULL &&
104414b1fadSschwarze 		    strcmp(nl_langinfo(CODESET), "UTF-8") != 0)
105414b1fadSschwarze 			v = setlocale(LC_CTYPE, "C");
106414b1fadSschwarze 
107414b1fadSschwarze 		if (v != NULL && MB_CUR_MAX > 1) {
10853d61c88Sschwarze 			p->enc = TERMENC_UTF8;
109a5e11edeSschwarze 			p->advance = locale_advance;
110a5e11edeSschwarze 			p->endline = locale_endline;
111a5e11edeSschwarze 			p->letter = locale_letter;
112a5e11edeSschwarze 			p->width = locale_width;
113a5e11edeSschwarze 		}
114a5e11edeSschwarze 	}
115a5e11edeSschwarze 
116*84680f53Sschwarze 	if (outopts->mdoc)
117b6695f6fSschwarze 		p->mdocstyle = 1;
1182ccd0917Sschwarze 	if (outopts->indent)
1192ccd0917Sschwarze 		p->defindent = outopts->indent;
1202ccd0917Sschwarze 	if (outopts->width)
1212ccd0917Sschwarze 		p->defrmargin = outopts->width;
1222ccd0917Sschwarze 	if (outopts->synopsisonly)
1232ccd0917Sschwarze 		p->synopsisonly = 1;
124f95d589eSschwarze 
125fe245e6aSschwarze 	assert(p->defindent < UINT16_MAX);
126fe245e6aSschwarze 	assert(p->defrmargin < UINT16_MAX);
127526e306bSschwarze 	return p;
128f95d589eSschwarze }
129f95d589eSschwarze 
130a5e11edeSschwarze void *
ascii_alloc(const struct manoutput * outopts)13116536faaSschwarze ascii_alloc(const struct manoutput *outopts)
132a5e11edeSschwarze {
133a5e11edeSschwarze 
13416536faaSschwarze 	return ascii_init(TERMENC_ASCII, outopts);
135a5e11edeSschwarze }
136a5e11edeSschwarze 
137a5e11edeSschwarze void *
utf8_alloc(const struct manoutput * outopts)13816536faaSschwarze utf8_alloc(const struct manoutput *outopts)
139a5e11edeSschwarze {
140a5e11edeSschwarze 
14116536faaSschwarze 	return ascii_init(TERMENC_UTF8, outopts);
142a5e11edeSschwarze }
143a5e11edeSschwarze 
144a5e11edeSschwarze void *
locale_alloc(const struct manoutput * outopts)14516536faaSschwarze locale_alloc(const struct manoutput *outopts)
146a5e11edeSschwarze {
147a5e11edeSschwarze 
14816536faaSschwarze 	return ascii_init(TERMENC_LOCALE, outopts);
149a5e11edeSschwarze }
150f95d589eSschwarze 
1515281506aSschwarze static void
ascii_setwidth(struct termp * p,int iop,int width)15213a35416Sschwarze ascii_setwidth(struct termp *p, int iop, int width)
1535281506aSschwarze {
1545281506aSschwarze 
15513a35416Sschwarze 	width /= 24;
156e93ea447Sschwarze 	p->tcol->rmargin = p->defrmargin;
15799b0a561Sschwarze 	if (iop > 0)
15810111bf6Sschwarze 		p->defrmargin += width;
15999b0a561Sschwarze 	else if (iop == 0)
16013a35416Sschwarze 		p->defrmargin = width ? (size_t)width : p->lastrmargin;
16113a35416Sschwarze 	else if (p->defrmargin > (size_t)width)
16210111bf6Sschwarze 		p->defrmargin -= width;
16310111bf6Sschwarze 	else
16499b0a561Sschwarze 		p->defrmargin = 0;
165fe245e6aSschwarze 	if (p->defrmargin > 1000)
166fe245e6aSschwarze 		p->defrmargin = 1000;
167e93ea447Sschwarze 	p->lastrmargin = p->tcol->rmargin;
168e93ea447Sschwarze 	p->tcol->rmargin = p->maxrmargin = p->defrmargin;
1695281506aSschwarze }
1705281506aSschwarze 
1712b036407Sschwarze void
terminal_sepline(void * arg)1722db2cb23Sschwarze terminal_sepline(void *arg)
1732b036407Sschwarze {
1742b036407Sschwarze 	struct termp	*p;
1752b036407Sschwarze 	size_t		 i;
1762b036407Sschwarze 
1772b036407Sschwarze 	p = (struct termp *)arg;
1782db2cb23Sschwarze 	(*p->endline)(p);
1792b036407Sschwarze 	for (i = 0; i < p->defrmargin; i++)
1802db2cb23Sschwarze 		(*p->letter)(p, '-');
1812db2cb23Sschwarze 	(*p->endline)(p);
1822db2cb23Sschwarze 	(*p->endline)(p);
1832b036407Sschwarze }
1842b036407Sschwarze 
1853ebeb861Sschwarze static size_t
ascii_width(const struct termp * p,int c)186a5e11edeSschwarze ascii_width(const struct termp *p, int c)
1873ebeb861Sschwarze {
18818bbf166Sschwarze 	return c != ASCII_BREAK && c != ASCII_NBRZW && c != ASCII_TABREF;
1893ebeb861Sschwarze }
1903ebeb861Sschwarze 
/*
 * Release a formatter by handing it to term_free().
 */
void
ascii_free(void *arg)
{
	struct termp	*term = arg;

	term_free(term);
}
197f95d589eSschwarze 
/*
 * Write one character to standard output; the formatter is not used.
 */
static void
ascii_letter(struct termp *p, int c)
{
	(void)putchar(c);
}
204f95d589eSschwarze 
205f95d589eSschwarze static void
ascii_begin(struct termp * p)206f95d589eSschwarze ascii_begin(struct termp *p)
207f95d589eSschwarze {
208f95d589eSschwarze 
209f95d589eSschwarze 	(*p->headf)(p, p->argf);
210f95d589eSschwarze }
211f95d589eSschwarze 
212f95d589eSschwarze static void
ascii_end(struct termp * p)213f95d589eSschwarze ascii_end(struct termp *p)
214f95d589eSschwarze {
215f95d589eSschwarze 
216f95d589eSschwarze 	(*p->footf)(p, p->argf);
217f95d589eSschwarze }
218f95d589eSschwarze 
219f95d589eSschwarze static void
ascii_endline(struct termp * p)220f95d589eSschwarze ascii_endline(struct termp *p)
221f95d589eSschwarze {
222f95d589eSschwarze 
223c0a657b3Sschwarze 	p->line++;
22430c2fcb2Sschwarze 	if ((int)p->tcol->offset > p->ti)
225e93ea447Sschwarze 		p->tcol->offset -= p->ti;
22630c2fcb2Sschwarze 	else
22730c2fcb2Sschwarze 		p->tcol->offset = 0;
22811d70615Sschwarze 	p->ti = 0;
229f95d589eSschwarze 	putchar('\n');
230f95d589eSschwarze }
231f95d589eSschwarze 
/*
 * Write len blanks to standard output, but never more than 256.
 */
static void
ascii_advance(struct termp *p, size_t len)
{
	size_t		 todo;

	/*
	 * XXX There used to be an "assert(len < UINT16_MAX)" here.
	 * That is not quite right because an input document can
	 * trigger it merely by providing large input.
	 * For now, simply truncate.
	 */
	todo = len > 256 ? 256 : len;
	while (todo > 0) {
		(void)putchar(' ');
		todo--;
	}
}
248769ee804Sschwarze 
24913a35416Sschwarze static int
ascii_hspan(const struct termp * p,const struct roffsu * su)250769ee804Sschwarze ascii_hspan(const struct termp *p, const struct roffsu *su)
251769ee804Sschwarze {
252769ee804Sschwarze 	double		 r;
253769ee804Sschwarze 
254769ee804Sschwarze 	switch (su->unit) {
255d5dc6f2eSschwarze 	case SCALE_BU:
25613a35416Sschwarze 		r = su->scale;
257d5dc6f2eSschwarze 		break;
25849aff9f8Sschwarze 	case SCALE_CM:
25913a35416Sschwarze 		r = su->scale * 240.0 / 2.54;
260d5dc6f2eSschwarze 		break;
261d5dc6f2eSschwarze 	case SCALE_FS:
26213a35416Sschwarze 		r = su->scale * 65536.0;
263769ee804Sschwarze 		break;
26449aff9f8Sschwarze 	case SCALE_IN:
26513a35416Sschwarze 		r = su->scale * 240.0;
266769ee804Sschwarze 		break;
267d5dc6f2eSschwarze 	case SCALE_MM:
26813a35416Sschwarze 		r = su->scale * 0.24;
269769ee804Sschwarze 		break;
27049aff9f8Sschwarze 	case SCALE_VS:
27113a35416Sschwarze 	case SCALE_PC:
27213a35416Sschwarze 		r = su->scale * 40.0;
27313a35416Sschwarze 		break;
27413a35416Sschwarze 	case SCALE_PT:
27513a35416Sschwarze 		r = su->scale * 10.0 / 3.0;
276769ee804Sschwarze 		break;
277d5dc6f2eSschwarze 	case SCALE_EN:
278d5dc6f2eSschwarze 	case SCALE_EM:
27913a35416Sschwarze 		r = su->scale * 24.0;
280769ee804Sschwarze 		break;
2814ffbec5dSschwarze 	default:
282d5dc6f2eSschwarze 		abort();
283769ee804Sschwarze 	}
284526e306bSschwarze 	return r > 0.0 ? r + 0.01 : r - 0.01;
285769ee804Sschwarze }
286769ee804Sschwarze 
28755f79d48Sschwarze const char *
ascii_uc2str(int uc)28855f79d48Sschwarze ascii_uc2str(int uc)
28955f79d48Sschwarze {
29055f79d48Sschwarze 	static const char nbrsp[2] = { ASCII_NBRSP, '\0' };
29155f79d48Sschwarze 	static const char *tab[] = {
29255f79d48Sschwarze 	"<NUL>","<SOH>","<STX>","<ETX>","<EOT>","<ENQ>","<ACK>","<BEL>",
29355f79d48Sschwarze 	"<BS>",	"\t",	"<LF>",	"<VT>",	"<FF>",	"<CR>",	"<SO>",	"<SI>",
29455f79d48Sschwarze 	"<DLE>","<DC1>","<DC2>","<DC3>","<DC4>","<NAK>","<SYN>","<ETB>",
29555f79d48Sschwarze 	"<CAN>","<EM>",	"<SUB>","<ESC>","<FS>",	"<GS>",	"<RS>",	"<US>",
29655f79d48Sschwarze 	" ",	"!",	"\"",	"#",	"$",	"%",	"&",	"'",
29755f79d48Sschwarze 	"(",	")",	"*",	"+",	",",	"-",	".",	"/",
29855f79d48Sschwarze 	"0",	"1",	"2",	"3",	"4",	"5",	"6",	"7",
29955f79d48Sschwarze 	"8",	"9",	":",	";",	"<",	"=",	">",	"?",
30055f79d48Sschwarze 	"@",	"A",	"B",	"C",	"D",	"E",	"F",	"G",
30155f79d48Sschwarze 	"H",	"I",	"J",	"K",	"L",	"M",	"N",	"O",
30255f79d48Sschwarze 	"P",	"Q",	"R",	"S",	"T",	"U",	"V",	"W",
30355f79d48Sschwarze 	"X",	"Y",	"Z",	"[",	"\\",	"]",	"^",	"_",
30455f79d48Sschwarze 	"`",	"a",	"b",	"c",	"d",	"e",	"f",	"g",
30555f79d48Sschwarze 	"h",	"i",	"j",	"k",	"l",	"m",	"n",	"o",
30655f79d48Sschwarze 	"p",	"q",	"r",	"s",	"t",	"u",	"v",	"w",
30755f79d48Sschwarze 	"x",	"y",	"z",	"{",	"|",	"}",	"~",	"<DEL>",
30855f79d48Sschwarze 	"<80>",	"<81>",	"<82>",	"<83>",	"<84>",	"<85>",	"<86>",	"<87>",
30955f79d48Sschwarze 	"<88>",	"<89>",	"<8A>",	"<8B>",	"<8C>",	"<8D>",	"<8E>",	"<8F>",
31055f79d48Sschwarze 	"<90>",	"<91>",	"<92>",	"<93>",	"<94>",	"<95>",	"<96>",	"<97>",
3118ac50ec5Sschwarze 	"<98>",	"<99>",	"<9A>",	"<9B>",	"<9C>",	"<9D>",	"<9E>",	"<9F>",
312f09271baSschwarze 	nbrsp,	"!",	"/\bc",	"-\bL",	"o\bx",	"=\bY",	"|",	"<section>",
313d8d0d815Sschwarze 	"\"",	"(C)",	"_\ba",	"<<",	"~",	"",	"(R)",	"-",
314c250368cSschwarze 	"<degree>","+-","^2",	"^3",	"'","<micro>","<paragraph>",".",
315c250368cSschwarze 	",",	"^1",	"_\bo",	">>",	"1/4",	"1/2",	"3/4",	"?",
316d8d0d815Sschwarze 	"`\bA",	"'\bA",	"^\bA",	"~\bA",	"\"\bA","o\bA",	"AE",	",\bC",
317d8d0d815Sschwarze 	"`\bE",	"'\bE",	"^\bE",	"\"\bE","`\bI",	"'\bI",	"^\bI",	"\"\bI",
318c250368cSschwarze 	"Dh",	"~\bN",	"`\bO",	"'\bO",	"^\bO",	"~\bO",	"\"\bO","x",
319d8d0d815Sschwarze 	"/\bO",	"`\bU",	"'\bU",	"^\bU",	"\"\bU","'\bY",	"Th",	"ss",
320d8d0d815Sschwarze 	"`\ba",	"'\ba",	"^\ba",	"~\ba",	"\"\ba","o\ba",	"ae",	",\bc",
321d8d0d815Sschwarze 	"`\be",	"'\be",	"^\be",	"\"\be","`\bi",	"'\bi",	"^\bi",	"\"\bi",
322c250368cSschwarze 	"dh",	"~\bn",	"`\bo",	"'\bo",	"^\bo",	"~\bo",	"\"\bo","/",
323d8d0d815Sschwarze 	"/\bo",	"`\bu",	"'\bu",	"^\bu",	"\"\bu","'\by",	"th",	"\"\by",
324d8d0d815Sschwarze 	"A",	"a",	"A",	"a",	"A",	"a",	"'\bC",	"'\bc",
325d8d0d815Sschwarze 	"^\bC",	"^\bc",	"C",	"c",	"C",	"c",	"D",	"d",
326d8d0d815Sschwarze 	"/\bD",	"/\bd",	"E",	"e",	"E",	"e",	"E",	"e",
327d8d0d815Sschwarze 	"E",	"e",	"E",	"e",	"^\bG",	"^\bg",	"G",	"g",
328d8d0d815Sschwarze 	"G",	"g",	",\bG",	",\bg",	"^\bH",	"^\bh",	"/\bH",	"/\bh",
329d8d0d815Sschwarze 	"~\bI",	"~\bi",	"I",	"i",	"I",	"i",	"I",	"i",
330d8d0d815Sschwarze 	"I",	"i",	"IJ",	"ij",	"^\bJ",	"^\bj",	",\bK",	",\bk",
331d8d0d815Sschwarze 	"q",	"'\bL",	"'\bl",	",\bL",	",\bl",	"L",	"l",	"L",
332d8d0d815Sschwarze 	"l",	"/\bL",	"/\bl",	"'\bN",	"'\bn",	",\bN",	",\bn",	"N",
33355f79d48Sschwarze 	"n",	"'n",	"Ng",	"ng",	"O",	"o",	"O",	"o",
334d8d0d815Sschwarze 	"O",	"o",	"OE",	"oe",	"'\bR",	"'\br",	",\bR",	",\br",
335d8d0d815Sschwarze 	"R",	"r",	"'\bS",	"'\bs",	"^\bS",	"^\bs",	",\bS",	",\bs",
336d8d0d815Sschwarze 	"S",	"s",	",\bT",	",\bt",	"T",	"t",	"/\bT",	"/\bt",
337d8d0d815Sschwarze 	"~\bU",	"~\bu",	"U",	"u",	"U",	"u",	"U",	"u",
338d8d0d815Sschwarze 	"U",	"u",	"U",	"u",	"^\bW",	"^\bw",	"^\bY",	"^\by",
339d8d0d815Sschwarze 	"\"\bY","'\bZ",	"'\bz",	"Z",	"z",	"Z",	"z",	"s",
34055f79d48Sschwarze 	"b",	"B",	"B",	"b",	"6",	"6",	"O",	"C",
34155f79d48Sschwarze 	"c",	"D",	"D",	"D",	"d",	"d",	"3",	"@",
342d8d0d815Sschwarze 	"E",	"F",	",\bf",	"G",	"G",	"hv",	"I",	"/\bI",
343d8d0d815Sschwarze 	"K",	"k",	"/\bl",	"l",	"W",	"N",	"n",	"~\bO",
34455f79d48Sschwarze 	"O",	"o",	"OI",	"oi",	"P",	"p",	"YR",	"2",
34555f79d48Sschwarze 	"2",	"SH",	"sh",	"t",	"T",	"t",	"T",	"U",
346d8d0d815Sschwarze 	"u",	"Y",	"V",	"Y",	"y",	"/\bZ",	"/\bz",	"ZH",
347d8d0d815Sschwarze 	"ZH",	"zh",	"zh",	"/\b2",	"5",	"5",	"ts",	"w",
34855f79d48Sschwarze 	"|",	"||",	"|=",	"!",	"DZ",	"Dz",	"dz",	"LJ",
34955f79d48Sschwarze 	"Lj",	"lj",	"NJ",	"Nj",	"nj",	"A",	"a",	"I",
35055f79d48Sschwarze 	"i",	"O",	"o",	"U",	"u",	"U",	"u",	"U",
35155f79d48Sschwarze 	"u",	"U",	"u",	"U",	"u",	"@",	"A",	"a",
352d8d0d815Sschwarze 	"A",	"a",	"AE",	"ae",	"/\bG",	"/\bg",	"G",	"g",
35355f79d48Sschwarze 	"K",	"k",	"O",	"o",	"O",	"o",	"ZH",	"zh",
354d8d0d815Sschwarze 	"j",	"DZ",	"Dz",	"dz",	"'\bG",	"'\bg",	"HV",	"W",
355d8d0d815Sschwarze 	"`\bN",	"`\bn",	"A",	"a",	"'\bAE","'\bae","O",	"o"};
35655f79d48Sschwarze 
3576899db98Sschwarze 	assert(uc >= 0);
358ed5ebdbaSschwarze 	if ((size_t)uc < sizeof(tab)/sizeof(tab[0]))
359526e306bSschwarze 		return tab[uc];
360526e306bSschwarze 	return mchars_uc2str(uc);
36155f79d48Sschwarze }
36255f79d48Sschwarze 
363a5e11edeSschwarze static size_t
locale_width(const struct termp * p,int c)364a5e11edeSschwarze locale_width(const struct termp *p, int c)
365a5e11edeSschwarze {
366a5e11edeSschwarze 	int		rc;
367a5e11edeSschwarze 
368c9fd5525Sschwarze 	if (c == ASCII_NBRSP)
369c9fd5525Sschwarze 		c = ' ';
370c9fd5525Sschwarze 	rc = wcwidth(c);
371c9fd5525Sschwarze 	if (rc < 0)
372c9fd5525Sschwarze 		rc = 0;
373526e306bSschwarze 	return rc;
374a5e11edeSschwarze }
375a5e11edeSschwarze 
/*
 * Write len wide blanks to standard output, but never more than 256.
 */
static void
locale_advance(struct termp *p, size_t len)
{
	size_t		 todo;

	/*
	 * XXX There used to be an "assert(len < UINT16_MAX)" here.
	 * That is not quite right because an input document can
	 * trigger it merely by providing large input.
	 * For now, simply truncate.
	 */
	todo = len > 256 ? 256 : len;
	while (todo > 0) {
		(void)putwchar(L' ');
		todo--;
	}
}
392a5e11edeSschwarze 
393a5e11edeSschwarze static void
locale_endline(struct termp * p)394a5e11edeSschwarze locale_endline(struct termp *p)
395a5e11edeSschwarze {
396a5e11edeSschwarze 
397c0a657b3Sschwarze 	p->line++;
39830c2fcb2Sschwarze 	if ((int)p->tcol->offset > p->ti)
399e93ea447Sschwarze 		p->tcol->offset -= p->ti;
40030c2fcb2Sschwarze 	else
40130c2fcb2Sschwarze 		p->tcol->offset = 0;
40211d70615Sschwarze 	p->ti = 0;
403a5e11edeSschwarze 	putwchar(L'\n');
404a5e11edeSschwarze }
405a5e11edeSschwarze 
/*
 * Write one wide character to standard output; the formatter is
 * not used.
 */
static void
locale_letter(struct termp *p, int c)
{
	(void)putwchar(c);
}
412