/* debug.c revision 1.16 */
/*	$NetBSD: debug.c,v 1.16 2023/05/20 10:09:02 rillig Exp $	*/

/*-
 * Copyright (c) 2023 The NetBSD Foundation, Inc.
 * All rights reserved.
 *
 * This code is derived from software contributed to The NetBSD Foundation
 * by Roland Illig <rillig@NetBSD.org>.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
 * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */
31
32#include <sys/cdefs.h>
33__RCSID("$NetBSD: debug.c,v 1.16 2023/05/20 10:09:02 rillig Exp $");
34
35#include <stdarg.h>
36
37#include "indent.h"
38
39#ifdef debug
40
/*-
 * Selects how much of the parser state the debug_ps_* output shows:
 *
 * true		every field is printed, whether it changed or not
 * false	only the fields that differ from the previous state are printed
 */
static bool debug_full_parser_state = true;
46
/*
 * Display names for lexer symbols, looked up as lsym_name[lsym] with a
 * lexer_symbol value.  The order presumably has to mirror the declaration of
 * lexer_symbol, which is not part of this file -- keep both in sync.
 */
const char *const lsym_name[] = {
	/*  0 */ "eof", "preprocessing", "newline", "comment",
	/*  4 */ "lparen_or_lbracket", "rparen_or_rbracket",
	/*  6 */ "lbrace", "rbrace", "period",
	/*  9 */ "unary_op", "binary_op", "postfix_op",
	/* 12 */ "question", "colon", "comma", "semicolon",
	/* 16 */ "typedef", "storage_class",
	/* 18 */ "type_outside_parentheses", "type_in_parentheses",
	/* 20 */ "tag", "case_label", "sizeof", "offsetof",
	/* 24 */ "word", "funcname",
	/* 26 */ "do", "else", "for", "if", "switch", "while", "return",
};
82
/*
 * Display names for parser symbols; this file indexes the table with
 * ps.s_sym[i] and ps.spaced_expr_psym.  The order presumably has to match
 * the parser symbol type declared elsewhere -- keep both in sync.
 */
const char *const psym_name[] = {
	/*  0 */ "0", "lbrace", "rbrace",
	/*  3 */ "decl", "stmt", "stmt_list",
	/*  6 */ "for_exprs",
	/*  7 */ "if_expr", "if_expr_stmt", "if_expr_stmt_else", "else",
	/* 11 */ "switch_expr",
	/* 12 */ "do", "do_stmt", "while_expr",
};
100
/* Display names for the values of ps.declaration, in index order. */
static const char *const declaration_name[] = {
	/* 0 */ "no",
	/* 1 */ "begin",
	/* 2 */ "end",
};
106
/* Display names for the values of ps.in_enum, in index order. */
static const char *const in_enum_name[] = {
	/* 0 */ "no",
	/* 1 */ "enum",
	/* 2 */ "type",
	/* 3 */ "brace",
};
113
/*
 * Display names for the 'cast' member of a parenthesis level (see
 * ps.paren[i].cast), in index order.  Each name already contains its
 * surrounding parentheses.
 */
const char *const paren_level_cast_name[] = {
	/* 0 */ "(unknown cast)",
	/* 1 */ "(maybe cast)",
	/* 2 */ "(no cast)",
};
119
/*
 * Display names for the values of ps.line_kind and ps.prev_line_kind, in
 * index order.
 */
static const char *const line_kind_name[] = {
	/* 0 */ "other",
	/* 1 */ "#if",
	/* 2 */ "#endif",
};
125
126void
127debug_printf(const char *fmt, ...)
128{
129	FILE *f = output == stdout ? stderr : stdout;
130	va_list ap;
131
132	va_start(ap, fmt);
133	vfprintf(f, fmt, ap);
134	va_end(ap);
135}
136
137void
138debug_println(const char *fmt, ...)
139{
140	FILE *f = output == stdout ? stderr : stdout;
141	va_list ap;
142
143	va_start(ap, fmt);
144	vfprintf(f, fmt, ap);
145	va_end(ap);
146	fprintf(f, "\n");
147}
148
/*
 * Print 'prefix', then the 'len' bytes starting at 's' in a visible form,
 * then 'suffix', all via debug_printf.
 *
 * Backslash and double quote are preceded by a backslash, other printable
 * characters are written as-is, newline and tab become \n and \t, and every
 * remaining byte is written as \x followed by two hex digits.
 */
void
debug_vis_range(const char *prefix, const char *s, size_t len,
    const char *suffix)
{
	const char *cur = s;

	debug_printf("%s", prefix);

	for (size_t remaining = len; remaining > 0; remaining--, cur++) {
		const char ch = *cur;

		if (ch == '\\' || ch == '"') {
			debug_printf("\\%c", ch);
			continue;
		}
		/* The printable test comes before the \n and \t cases. */
		if (isprint((unsigned char)ch)) {
			debug_printf("%c", ch);
			continue;
		}
		if (ch == '\n') {
			debug_printf("\\n");
			continue;
		}
		if (ch == '\t') {
			debug_printf("\\t");
			continue;
		}
		debug_printf("\\x%02x", (unsigned char)ch);
	}

	debug_printf("%s", suffix);
}
169
170static void
171debug_print_buf(const char *name, const struct buffer *buf)
172{
173	if (buf->len > 0) {
174		debug_printf("%s ", name);
175		debug_vis_range("\"", buf->st, buf->len, "\"\n");
176	}
177}
178
179void
180debug_buffers(void)
181{
182	if (lab.len > 0) {
183		debug_printf(" label ");
184		debug_vis_range("\"", lab.st, lab.len, "\"");
185	}
186	if (code.len > 0) {
187		debug_printf(" code ");
188		debug_vis_range("\"", code.st, code.len, "\"");
189	}
190	if (com.len > 0) {
191		debug_printf(" comment ");
192		debug_vis_range("\"", com.st, com.len, "\"");
193	}
194}
195
/*
 * Helpers for dumping a single member 'name' of the parser state.
 *
 * Each macro compares ps.name with prev_ps.name; both 'ps' and 'prev_ps'
 * must be visible as objects (not pointers) at the place of use.
 *  - If the member differs, a line "old -> new ps.name" is printed.
 *  - Otherwise, if debug_full_parser_state is set, the current value alone
 *    is printed.
 *  - Otherwise nothing is printed.
 *
 * debug_ps_bool	prints the value as "[x]" or "[ ]"
 * debug_ps_int		prints the value with %3d
 * debug_ps_enum	prints (names)[value], 'names' being a string table
 *
 * The bodies are wrapped in do { } while (0) so that each use forms exactly
 * one statement; a bare if/else-if expansion would capture the 'else' of an
 * enclosing unbraced 'if'.
 */
#define debug_ps_bool(name) \
	do { \
		if (ps.name != prev_ps.name) \
			debug_println("[%c] -> [%c] ps." #name, \
			    prev_ps.name ? 'x' : ' ', \
			    ps.name ? 'x' : ' '); \
		else if (debug_full_parser_state) \
			debug_println("       [%c] ps." #name, \
			    ps.name ? 'x' : ' '); \
	} while (0)
#define debug_ps_int(name) \
	do { \
		if (ps.name != prev_ps.name) \
			debug_println("%3d -> %3d ps." #name, \
			    prev_ps.name, ps.name); \
		else if (debug_full_parser_state) \
			debug_println("       %3d ps." #name, ps.name); \
	} while (0)
#define debug_ps_enum(name, names) \
	do { \
		if (ps.name != prev_ps.name) \
			debug_println("%3s -> %3s ps." #name, \
			    (names)[prev_ps.name], (names)[ps.name]); \
		else if (debug_full_parser_state) \
			debug_println("%10s ps." #name, (names)[ps.name]); \
	} while (0)
213
214static bool
215ps_paren_has_changed(const struct parser_state *prev_ps)
216{
217	if (prev_ps->nparen != ps.nparen)
218		return true;
219
220	const paren_level_props *prev = prev_ps->paren, *curr = ps.paren;
221	for (int i = 0; i < ps.nparen; i++)
222		if (curr[i].indent != prev[i].indent
223		    || curr[i].cast != prev[i].cast)
224			return true;
225	return false;
226}
227
228static void
229debug_ps_paren(const struct parser_state *prev_ps)
230{
231	if (!debug_full_parser_state && !ps_paren_has_changed(prev_ps))
232		return;
233
234	debug_printf("           ps.paren:");
235	for (int i = 0; i < ps.nparen; i++) {
236		debug_printf(" %s%d",
237		    paren_level_cast_name[ps.paren[i].cast],
238		    ps.paren[i].indent);
239	}
240	if (ps.nparen == 0)
241		debug_printf(" none");
242	debug_println("");
243}
244
245static bool
246ps_di_stack_has_changed(const struct parser_state *prev_ps)
247{
248	if (prev_ps->decl_level != ps.decl_level)
249		return true;
250	for (int i = 0; i < ps.decl_level; i++)
251		if (prev_ps->di_stack[i] != ps.di_stack[i])
252			return true;
253	return false;
254}
255
256static void
257debug_ps_di_stack(const struct parser_state *prev_ps)
258{
259	bool changed = ps_di_stack_has_changed(prev_ps);
260	if (!debug_full_parser_state && !changed)
261		return;
262
263	debug_printf("    %s     ps.di_stack:", changed ? "->" : "  ");
264	for (int i = 0; i < ps.decl_level; i++)
265		debug_printf(" %d", ps.di_stack[i]);
266	if (ps.decl_level == 0)
267		debug_printf(" none");
268	debug_println("");
269}
270
271void
272debug_parser_state(lexer_symbol lsym)
273{
274	static struct parser_state prev_ps;
275
276	debug_println("");
277	debug_printf("line %d: %s", line_no, lsym_name[lsym]);
278	debug_vis_range(" \"", token.st, token.len, "\"\n");
279
280	debug_print_buf("label", &lab);
281	debug_print_buf("code", &code);
282	debug_print_buf("comment", &com);
283
284	debug_println("           ps.prev_token = %s",
285	    lsym_name[ps.prev_token]);
286	debug_ps_bool(curr_col_1);
287	debug_ps_bool(next_col_1);
288	debug_ps_bool(next_unary);
289	debug_ps_bool(is_function_definition);
290	debug_ps_bool(want_blank);
291	debug_ps_bool(force_nl);
292	debug_ps_int(line_start_nparen);
293	debug_ps_int(nparen);
294	debug_ps_paren(&prev_ps);
295
296	debug_ps_int(comment_delta);
297	debug_ps_int(n_comment_delta);
298	debug_ps_int(com_ind);
299
300	debug_ps_bool(block_init);
301	debug_ps_int(block_init_level);
302	debug_ps_bool(init_or_struct);
303
304	debug_ps_int(ind_level);
305	debug_ps_int(ind_level_follow);
306
307	debug_ps_int(decl_level);
308	debug_ps_di_stack(&prev_ps);
309	debug_ps_bool(decl_on_line);
310	debug_ps_bool(in_decl);
311	debug_ps_enum(declaration, declaration_name);
312	debug_ps_bool(blank_line_after_decl);
313	debug_ps_bool(in_func_def_params);
314	debug_ps_enum(in_enum, in_enum_name);
315	debug_ps_bool(decl_indent_done);
316	debug_ps_int(decl_ind);
317	debug_ps_bool(tabs_to_var);
318
319	debug_ps_bool(in_stmt_or_decl);
320	debug_ps_bool(in_stmt_cont);
321	debug_ps_bool(is_case_label);
322	debug_ps_bool(seen_case);
323
324	// The debug output for the parser symbols is done in 'parse' instead.
325
326	debug_ps_enum(spaced_expr_psym, psym_name);
327	debug_ps_int(quest_level);
328
329	debug_ps_enum(line_kind, line_kind_name);
330	debug_ps_enum(prev_line_kind, line_kind_name);
331
332	prev_ps = ps;
333}
334
335void
336debug_parse_stack(const char *situation)
337{
338	printf("parse stack %s:", situation);
339	for (int i = 1; i <= ps.tos; ++i)
340		printf(" %s %d", psym_name[ps.s_sym[i]], ps.s_ind_level[i]);
341	if (ps.tos == 0)
342		printf(" empty");
343	printf("\n");
344}
345#endif
346