@@ -1,205 +1,205 @@
-/* $NetBSD: lsym_binary_op.c,v 1.11 2023/06/04 22:57:18 rillig Exp $ */
+/* $NetBSD: lsym_binary_op.c,v 1.12 2023/06/14 08:25:15 rillig Exp $ */
 /*
  * Tests for the token lsym_binary_op, which represents a binary operator in
  * an expression.  Examples for binary operators are '>>', '=', '+', '&&'.
+ *
  * Binary operators are surrounded by blanks.
+ *
  * Some tokens like '+', '*' or '&' can be either binary or unary operators,
  * with an entirely different meaning.
+ *
  * The token '*' is not only a binary or a unary operator, it is used in types
  * as well, to derive a pointer type.
+ *
  * See also:
  *	lsym_postfix_op.c	for postfix unary operators
  *	lsym_unary_op.c		for prefix unary operators
  *	lsym_colon.c		for ':'
  *	lsym_question.c		for '?'
  *	lsym_comma.c		for ','
  *	C99 6.4.6		"Punctuators"
  */
 //indent input
 void
 binary_operators(void)
+{
 	/* In the order of appearance in C11 6.5. */
 	a = a * a;
 	a = a / a;
 	a = a % a;
 	a = a + a;
 	a = a - a;
 	a = a << a;
 	a = a >> a;
 	a = a < a;
 	a = a > a;
 	a = a <= a;
 	a = a >= a;
 	a = a == a;
 	a = a != a;
 	a = a & a;
 	a = a ^ a;
 	a = a | a;
 	a = a && a;
 	a = a || a;
 	a = a ? a : a;
 	a = a;
 	a *= a;
 	a /= a;
 	a %= a;
 	a += a;
 	a -= a;
 	a <<= a;
 	a >>= a;
 	a &= a;
 	a ^= a;
 	a |= a;
 	a = a, a;
+}
 //indent end
 //indent run-equals-input
 /*
  * If a '*' is immediately followed by another '*', they still form separate
  * operators. The first is a binary operator, the second is unary.
  */
 //indent input
 int var = expr**ptr;
 //indent end
 //indent run -di0
 int var = expr * *ptr;
 //indent end
 /*
  * Before 2023-06-04, indent allowed for arbitrary repetitions of some operator
  * characters, followed by an arbitrary amount of '='.  This could be used for
  * operators like '&&' or '|||==='.
+ *
  * Before 2021-03-07 22:11:01, the comment '//' was treated as a binary
  * operator as well, and so was the comment '/////', leading to unexpected
  * spacing.
+ *
  * See lexi.c, lexi, "default:".
  */
 //indent input
 void
 long_run_of_operators(void)
+{
 	if (a &&&&&&& b)
 		return;
 	if (a |||=== b)
 		return;
+}
 //indent end
 //indent run
 void
 long_run_of_operators(void)
+{
 	if (a && && && &b)
 		return;
 	if (a || |= == b)
 		return;
+}
 //indent end
 /*
  * Long chains of '+' and '-' must be split into several operators as the
  * lexer has to distinguish between '++' and '+' early.  The following
  * sequence is thus tokenized as:
+ *
  *	word		"a"
  *	postfix_op	"++"
  *	binary_op	"++"
  *	unary_op	"++"
  *	unary_op	"+"
  *	word		"b"
+ *
  * See lexi.c, lexi, "case '+':".
  */
 //indent input
 void
 joined_unary_and_binary_operators(void)
+{
 	if (a +++++++ b)
 		return;
+}
 //indent end
 //indent run
 void
 joined_unary_and_binary_operators(void)
+{
 	if (a++ ++ ++ +b)
 		return;
+}
 //indent end
 /*
  * Ensure that the result of the indentation does not depend on whether a
  * token from the input starts in column 1 or 9.
+ *
- * See process_binary_op, ps.curr_col_1.
+ * See process_binary_op.
  */
 //indent input
 int col_1 //
 = //
 ;
 int col_9 //
 	= //
 ;
 //indent end
 //indent run
 int		col_1		//
 =				//
 ;
 int		col_9		//
 =				//
 ;
 //indent end
 /*
  * The ternary conditional operator is not a binary operator, but both its
  * components '?' and ':' follow the same spacing rules.
  */
 //indent input
 int conditional = condition ? number : number;
 //indent end
 //indent run-equals-input -di0
 // After a ']', a '*' is a binary operator.
 //indent input
 int x = arr[3]*y;
 //indent end
 //indent run -di0
 int x = arr[3] * y;
 //indent end
 /*
  * Ensure that after an assignment, a '*=' operator is properly spaced, like
  * any other binary operator.
  */
 //indent input
+{
 	a = a;
 	a *= b *= c;
+}
 //indent end
 //indent run-equals-input -di0

 @@ -1,398 +1,397 @@
-/*	$NetBSD: debug.c,v 1.54 2023/06/14 07:20:55 rillig Exp $	*/
+/*	$NetBSD: debug.c,v 1.55 2023/06/14 08:25:15 rillig Exp $	*/
 /*-
  * Copyright (c) 2023 The NetBSD Foundation, Inc.
  * All rights reserved.
+ *
  * This code is derived from software contributed to The NetBSD Foundation
  * by Roland Illig <rillig@NetBSD.org>.
+ *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
+ *
  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  * POSSIBILITY OF SUCH DAMAGE.
  */
 #include <sys/cdefs.h>
-__RCSID("$NetBSD: debug.c,v 1.54 2023/06/14 07:20:55 rillig Exp $");
+__RCSID("$NetBSD: debug.c,v 1.55 2023/06/14 08:25:15 rillig Exp $");
 #include <stdarg.h>
 #include <string.h>
 #include "indent.h"
 #ifdef debug
 static struct {
 	/*-
 	 * false	show only the changes to the parser state
 	 * true		show unchanged parts of the parser state as well
 	 */
 	bool full_parser_state;
 } config = {
 	.full_parser_state = false,
 };
 const char *const lsym_name[] = {
 	"eof",
 	"preprocessing",
 	"newline",
 	"comment",
 	"lparen",
 	"rparen",
 	"lbracket",
 	"rbracket",
 	"lbrace",
 	"rbrace",
 	"period",
 	"unary_op",
 	"sizeof",
 	"offsetof",
 	"postfix_op",
 	"binary_op",
 	"question",
 	"question_colon",
 	"comma",
 	"typedef",
 	"modifier",
 	"tag",
 	"type_outside_parentheses",
 	"type_in_parentheses",
 	"word",
 	"funcname",
 	"label_colon",
 	"other_colon",
 	"semicolon",
 	"case",
 	"default",
 	"do",
 	"else",
 	"for",
 	"if",
 	"switch",
 	"while",
 	"return",
 };
 const char *const psym_name[] = {
 	"-",
 	"{block",
 	"{struct",
 	"{union",
 	"{enum",
 	"}",
 	"decl",
 	"stmt",
 	"for_exprs",
 	"if_expr",
 	"if_expr_stmt",
 	"if_expr_stmt_else",
 	"else",
 	"switch_expr",
 	"do",
 	"do_stmt",
 	"while_expr",
 };
 static const char *const declaration_name[] = {
 	"no",
 	"begin",
 	"end",
 };
 const char *const paren_level_cast_name[] = {
 	"(unknown cast)",
 	"(maybe cast)",
 	"(no cast)",
 };
 const char *const line_kind_name[] = {
 	"other",
 	"blank",
 	"#if",
 	"#endif",
 	"stmt head",
 	"}",
 	"block comment",
 	"case/default",
 };
 static const char *const extra_expr_indent_name[] = {
 	"no",
 	"maybe",
 	"last",
 };
 static struct {
 	struct parser_state prev_ps;
 	bool ps_first;
 	const char *heading;
 	unsigned wrote_newlines;
 } state = {
 	.ps_first = true,
 	.wrote_newlines = 1,
 };
 void
 debug_printf(const char *fmt, ...)
+{
+	/*
+	 * Write formatted debug text without a trailing newline.  A pending
+	 * section heading is written first, on its own line, and then
+	 * cleared.  The debug stream is stderr if the formatted code goes to
+	 * stdout, otherwise it is stdout.
+	 */
 	FILE *f = output == stdout ? stderr : stdout;
 	va_list ap;
 	if (state.heading != NULL) {
 		fprintf(f, "%s\n", state.heading);
 		state.heading = NULL;
+	}
 	va_start(ap, fmt);
 	vfprintf(f, fmt, ap);
 	va_end(ap);
 	state.wrote_newlines = 0;
+}
 void
 debug_println(const char *fmt, ...)
+{
+	/*
+	 * Like debug_printf, but terminate the text with a newline.  The
+	 * counter state.wrote_newlines tracks how many newlines end the
+	 * output: an empty format adds one to it, any other format resets it
+	 * to 1.
+	 */
 	FILE *f = output == stdout ? stderr : stdout;
 	va_list ap;
 	if (state.heading != NULL) {
 		fprintf(f, "%s\n", state.heading);
 		state.heading = NULL;
 		state.wrote_newlines = 1;
+	}
 	va_start(ap, fmt);
 	vfprintf(f, fmt, ap);
 	va_end(ap);
 	fprintf(f, "\n");
 	state.wrote_newlines = fmt[0] == '\0' ? state.wrote_newlines + 1 : 1;
+}
 void
 debug_blank_line(void)
+{
+	/*
+	 * Print empty lines until the debug output ends with at least two
+	 * newlines, that is, with a blank line.
+	 */
 	while (state.wrote_newlines < 2)
 		debug_println("");
+}
 void
 debug_vis_range(const char *prefix, const char *s, size_t len,
     const char *suffix)
+{
+	/*
+	 * Print the len bytes starting at s in a visible form, between
+	 * prefix and suffix.  Backslash and double quote are escaped with a
+	 * backslash, other printable characters are written as-is, newline
+	 * and tab become "\n" and "\t", and every remaining byte is written
+	 * as a two-digit "\x" hex escape.
+	 */
 	debug_printf("%s", prefix);
 	for (size_t i = 0; i < len; i++) {
 		const char *p = s + i;
 		if (*p == '\\' || *p == '"')
 			debug_printf("\\%c", *p);
 		else if (isprint((unsigned char)*p))
 			debug_printf("%c", *p);
 		else if (*p == '\n')
 			debug_printf("\\n");
 		else if (*p == '\t')
 			debug_printf("\\t");
 		else
 			debug_printf("\\x%02x", (unsigned char)*p);
+	}
 	debug_printf("%s", suffix);
+}
 void
 debug_print_buf(const char *name, const struct buffer *buf)
+{
+	/*
+	 * Print the name of the buffer followed by its content in double
+	 * quotes; print nothing if the buffer is empty.
+	 */
 	if (buf->len > 0) {
 		debug_printf(" %s ", name);
 		debug_vis_range("\"", buf->s, buf->len, "\"");
+	}
+}
 void
 debug_buffers(void)
+{
+	/*
+	 * Print the non-empty ones of the buffers 'lab', 'code' and 'com',
+	 * followed by a blank line.
+	 */
 	debug_print_buf("label", &lab);
 	debug_print_buf("code", &code);
 	debug_print_buf("comment", &com);
 	debug_blank_line();
+}
 static void
 write_ps_bool(const char *name, bool prev, bool curr)
+{
+	/*
+	 * Print a boolean member of the parser state.  If there is a previous
+	 * state and the value differs from it, the marker is '-' for a change
+	 * from true to false and '+' for a change from false to true.
+	 * Otherwise the current value is printed as 'x' or ' ', but only for
+	 * the first dump or if config.full_parser_state is set.
+	 */
 	if (!state.ps_first && curr != prev) {
 		char diff = " -+x"[(prev ? 1 : 0) + (curr ? 2 : 0)];
 		debug_println("        [%c]  ps.%s", diff, name);
 	} else if (config.full_parser_state || state.ps_first)
 		debug_println("        [%c]  ps.%s", curr ? 'x' : ' ', name);
+}
 static void
 write_ps_int(const char *name, int prev, int curr)
+{
+	/*
+	 * Print an integer member of the parser state, as "prev -> curr" if
+	 * it changed since the previous dump.  An unchanged value is only
+	 * printed for the first dump or if config.full_parser_state is set.
+	 */
 	if (!state.ps_first && curr != prev)
 		debug_println(" %3d -> %3d  ps.%s", prev, curr, name);
 	else if (config.full_parser_state || state.ps_first)
 		debug_println("        %3d  ps.%s", curr, name);
+}
 static void
 write_ps_enum(const char *name, const char *prev, const char *curr)
+{
+	/*
+	 * Print an enum member of the parser state, given the names of its
+	 * previous and current value.  The names are compared as strings to
+	 * detect a change; an unchanged value is only printed for the first
+	 * dump or if config.full_parser_state is set.
+	 */
 	if (!state.ps_first && strcmp(prev, curr) != 0)
 		debug_println(" %3s -> %3s  ps.%s", prev, curr, name);
 	else if (config.full_parser_state || state.ps_first)
 		debug_println(" %10s  ps.%s", curr, name);
+}
 static bool
 ps_paren_has_changed(void)
+{
+	/*
+	 * Return whether the number of open parentheses or the indentation
+	 * or cast kind of any open level differs from the previous dump.
+	 */
 	if (state.prev_ps.nparen != ps.nparen)
 		return true;
 	const struct paren_level *prev = state.prev_ps.paren, *curr = ps.paren;
 	for (int i = 0; i < ps.nparen; i++)
 		if (curr[i].indent != prev[i].indent
 		    || curr[i].cast != prev[i].cast)
 			return true;
 	return false;
+}
 static void
 debug_ps_paren(void)
+{
+	/*
+	 * Print the cast kind and indentation of each open parenthesis
+	 * level, or "none" if no level is open.  Nothing is printed if the
+	 * levels are unchanged, unless this is the first dump or
+	 * config.full_parser_state is set.
+	 */
 	if (!config.full_parser_state && !ps_paren_has_changed()
 	    && !state.ps_first)
 		return;
 	debug_printf("             ps.paren:");
 	for (int i = 0; i < ps.nparen; i++) {
 		debug_printf(" %s%d",
 		    paren_level_cast_name[ps.paren[i].cast],
 		    ps.paren[i].indent);
+	}
 	if (ps.nparen == 0)
 		debug_printf(" none");
 	debug_println("");
+}
 static bool
 ps_di_stack_has_changed(void)
+{
+	/*
+	 * Return whether decl_level or any of the first decl_level entries
+	 * of di_stack differs from the previous dump.
+	 */
 	if (state.prev_ps.decl_level != ps.decl_level)
 		return true;
 	for (int i = 0; i < ps.decl_level; i++)
 		if (state.prev_ps.di_stack[i] != ps.di_stack[i])
 			return true;
 	return false;
+}
 static void
 debug_ps_di_stack(void)
+{
+	/*
+	 * Print the first decl_level entries of di_stack, or "none" if
+	 * decl_level is 0, marking the line with "->" if the stack changed
+	 * since the previous dump.  Nothing is printed if the stack is
+	 * unchanged, unless this is the first dump or
+	 * config.full_parser_state is set.
+	 */
 	bool changed = ps_di_stack_has_changed();
 	if (!config.full_parser_state && !changed && !state.ps_first)
 		return;
 	debug_printf("     %s      ps.di_stack:", changed ? "->" : "  ");
 	for (int i = 0; i < ps.decl_level; i++)
 		debug_printf(" %d", ps.di_stack[i]);
 	if (ps.decl_level == 0)
 		debug_printf(" none");
 	debug_println("");
+}
 #define debug_ps_bool(name) \
 	write_ps_bool(#name, state.prev_ps.name, ps.name)
 #define debug_ps_int(name) \
 	write_ps_int(#name, state.prev_ps.name, ps.name)
 #define debug_ps_enum(name, names) \
         write_ps_enum(#name, (names)[state.prev_ps.name], (names)[ps.name])
 void
 debug_parser_state(void)
+{
+	/*
+	 * Dump the members of the parser state 'ps', grouped under section
+	 * headings.  A heading is only written when a member of its section
+	 * is actually printed, see debug_printf.  Afterwards, remember the
+	 * current state so that the next dump can show the differences.
+	 */
 	debug_blank_line();
 	state.heading = "token classification";
 	debug_ps_enum(prev_lsym, lsym_name);
 	debug_ps_bool(in_stmt_or_decl);
 	debug_ps_bool(in_decl);
 	debug_ps_bool(in_var_decl);
 	debug_ps_bool(in_init);
 	debug_ps_int(init_level);
 	debug_ps_bool(line_has_func_def);
 	debug_ps_bool(in_func_def_params);
 	debug_ps_bool(line_has_decl);
 	debug_ps_enum(lbrace_kind, psym_name);
 	debug_ps_enum(spaced_expr_psym, psym_name);
 	debug_ps_bool(seen_case);
 	debug_ps_bool(prev_paren_was_cast);
 	debug_ps_int(quest_level);
 	state.heading = "indentation of statements and declarations";
 	debug_ps_int(ind_level);
 	debug_ps_int(ind_level_follow);
 	debug_ps_bool(in_stmt_cont);
 	debug_ps_int(decl_level);
 	debug_ps_di_stack();
 	debug_ps_bool(decl_indent_done);
 	debug_ps_int(decl_ind);
 	debug_ps_bool(tabs_to_var);
 	debug_ps_enum(extra_expr_indent, extra_expr_indent_name);
 	// The parser symbol stack is printed in debug_psyms_stack instead.
 	state.heading = "spacing inside a statement or declaration";
 	debug_ps_bool(next_unary);
 	debug_ps_bool(want_blank);
 	debug_ps_int(ind_paren_level);
 	debug_ps_int(nparen);
 	debug_ps_paren();
 	state.heading = "horizontal spacing for comments";
 	debug_ps_int(comment_delta);
 	debug_ps_int(n_comment_delta);
 	debug_ps_int(com_ind);
 	state.heading = "vertical spacing";
 	debug_ps_bool(break_after_comma);
 	debug_ps_bool(force_nl);
 	debug_ps_enum(declaration, declaration_name);
 	debug_ps_bool(blank_line_after_decl);
 	state.heading = "comments";
-	debug_ps_bool(curr_col_1);
 	debug_ps_bool(next_col_1);
 	state.heading = NULL;
 	debug_blank_line();
 	state.prev_ps = ps;
 	state.ps_first = false;
+}
 void
 debug_psyms_stack(const char *situation)
+{
+	/*
+	 * Print the parser symbol stack on a single line, labelled with the
+	 * given situation: for each entry from the bottom up to and including
+	 * 'top', its indentation level and the name of its symbol.
+	 */
 	debug_printf("parse stack %s:", situation);
 	const struct psym_stack *psyms = &ps.psyms;
 	for (int i = 0; i <= psyms->top; ++i)
 		debug_printf(" %d %s",
 		    psyms->ind_level[i], psym_name[psyms->sym[i]]);
 	debug_println("");
+}
 #endif

 @@ -1,534 +1,533 @@
-/*	$NetBSD: indent.h,v 1.189 2023/06/14 07:20:55 rillig Exp $	*/
+/*	$NetBSD: indent.h,v 1.190 2023/06/14 08:25:15 rillig Exp $	*/
 /*-
  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
+ *
  * Copyright (c) 2001 Jens Schweikhardt
  * All rights reserved.
+ *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
+ *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 /*-
  * SPDX-License-Identifier: BSD-4-Clause
+ *
  * Copyright (c) 1985 Sun Microsystems, Inc.
  * Copyright (c) 1980, 1993
  *	The Regents of the University of California.  All rights reserved.
  * All rights reserved.
+ *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  * 3. All advertising materials mentioning features or use of this software
  *    must display the following acknowledgement:
  *	This product includes software developed by the University of
  *	California, Berkeley and its contributors.
  * 4. Neither the name of the University nor the names of its contributors
  *    may be used to endorse or promote products derived from this software
  *    without specific prior written permission.
+ *
  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 #include <ctype.h>
 #include <stdbool.h>
 #include <stdio.h>
 typedef enum lexer_symbol {
 	lsym_eof,
 	lsym_preprocessing,	/* the initial '#' of a preprocessing line */
 	lsym_newline,
 	lsym_comment,		/* the initial '/ *' or '//' of a comment */
 	lsym_lparen,
 	lsym_rparen,
 	lsym_lbracket,
 	lsym_rbracket,
 	lsym_lbrace,
 	lsym_rbrace,
 	lsym_period,
 	lsym_unary_op,		/* e.g. '*', '&', '-' or leading '++' */
 	lsym_sizeof,
 	lsym_offsetof,
 	lsym_postfix_op,	/* trailing '++' or '--' */
 	lsym_binary_op,		/* e.g. '*', '&', '<<', '&&' or '/=' */
 	lsym_question,		/* the '?' from a '?:' expression */
 	lsym_question_colon,	/* the ':' from a '?:' expression */
 	lsym_comma,
 	lsym_typedef,
 	lsym_modifier,		/* modifiers for types, functions, variables */
 	lsym_tag,		/* 'struct', 'union' or 'enum' */
 	lsym_type_outside_parentheses,
 	lsym_type_in_parentheses,
 	lsym_word,		/* identifier, constant or string */
 	lsym_funcname,		/* name of a function being defined */
 	lsym_label_colon,	/* the ':' after a label */
 	lsym_other_colon,	/* bit-fields, generic-association (C11),
 				 * enum-type-specifier (C23),
 				 * attribute-prefixed-token (C23),
 				 * pp-prefixed-parameter (C23 6.10) */
 	lsym_semicolon,
 	lsym_case,
 	lsym_default,
 	lsym_do,
 	lsym_else,
 	lsym_for,
 	lsym_if,
 	lsym_switch,
 	lsym_while,
 	lsym_return,
 } lexer_symbol;
 /*
  * Structure of the source code, in terms of declarations, statements and
  * braces; used to determine the indentation level of these parts.
  */
 typedef enum parser_symbol {
 	psym_0,			/* a placeholder; not stored on the stack */
 	psym_lbrace_block,	/* '{' for a block of code */
 	psym_lbrace_struct,	/* '{' in 'struct ... { ... }' */
 	psym_lbrace_union,	/* '{' in 'union ... { ... }' */
 	psym_lbrace_enum,	/* '{' in 'enum ... { ... }' */
 	psym_rbrace,		/* not stored on the stack */
 	psym_decl,
 	psym_stmt,
 	psym_for_exprs,		/* 'for' '(' ... ')' */
 	psym_if_expr,		/* 'if' '(' expr ')' */
 	psym_if_expr_stmt,	/* 'if' '(' expr ')' stmt */
 	psym_if_expr_stmt_else,	/* 'if' '(' expr ')' stmt 'else' */
 	psym_else,		/* 'else'; not stored on the stack */
 	psym_switch_expr,	/* 'switch' '(' expr ')' */
 	psym_do,		/* 'do' */
 	psym_do_stmt,		/* 'do' stmt */
 	psym_while_expr,	/* 'while' '(' expr ')' */
 } parser_symbol;
 /* A range of characters, only null-terminated in debug mode. */
 struct buffer {
 	char *s;
 	size_t len;
 	size_t cap;
 };
 extern FILE *input;
 extern FILE *output;
 /*
  * The current line from the input file, used by the lexer to generate tokens.
  * To read from the line, start at inp_p and continue up to and including the
  * next '\n'. To read beyond the '\n', call inp_skip or inp_next, which will
  * make the next line available, invalidating any pointers into the previous
  * line.
  */
 extern struct buffer inp;
 extern const char *inp_p;
 extern struct buffer token;	/* the current token to be processed, is
 				 * typically copied to the buffer 'code', or in
 				 * some cases to 'lab'. */
 extern struct buffer lab;	/* the label or preprocessor directive */
 extern struct buffer code;	/* the main part of the current line of code,
 				 * containing declarations or statements */
 extern struct buffer com;	/* the trailing comment of the line, or the
 				 * start or end of a multi-line comment, or
 				 * while in process_comment, a single line of a
 				 * multi-line comment */
 extern struct options {
 	bool blank_line_around_conditional_compilation;
 	bool blank_line_after_decl_at_top;	/* this is vaguely similar to
 						 * blank_line_after_decl except
 						 * that it only applies to the
 						 * first set of declarations in
 						 * a procedure (just after the
 						 * first '{') and it causes a
 						 * blank line to be generated
 						 * even if there are no
 						 * declarations */
 	bool blank_line_after_decl;
 	bool blank_line_after_proc;
 	bool blank_line_before_block_comment;
 	bool break_after_comma;	/* whether to add a line break after each
 				 * declarator */
 	bool brace_same_line;	/* whether a brace should be on same line as an
 				 * if, while, etc. */
 	bool blank_after_sizeof;
 	bool comment_delimiter_on_blank_line;
 	int decl_comment_column;	/* the column in which comments after
 					 * declarations should be put */
 	bool cuddle_else;	/* whether 'else' should cuddle up to '}' */
 	int continuation_indent;	/* the indentation between the edge of
 					 * code and continuation lines */
 	float case_indent;	/* the distance (measured in indentation
 				 * levels) to indent case labels from the
 				 * switch statement */
 	int comment_column;	/* the column in which comments to the right of
 				 * code should start */
 	int decl_indent;	/* indentation of identifier in declaration */
 	bool left_justify_decl;
 	int unindent_displace;	/* comments not to the right of code will be
 				 * placed this many indentation levels to the
 				 * left of code */
 	bool extra_expr_indent;	/* whether continuation lines from the
 				 * expression part of "if (e)", "while (e)",
 				 * "for (e; e; e)" should be indented an extra
 				 * tab stop so that they are not confused with
 				 * the code that follows */
 	bool else_if_in_same_line;
 	bool function_brace_split;	/* split function declaration and brace
 					 * onto separate lines */
 	bool format_col1_comments;	/* whether comments that start in
 					 * column 1 are to be reformatted (just
 					 * like comments that begin in later
 					 * columns) */
 	bool format_block_comments;	/* whether to reformat comments that
 					 * begin with '/ * \n' */
 	bool indent_parameters;
 	int indent_size;	/* the size of one indentation level */
 	int block_comment_max_line_length;
 	int local_decl_indent;	/* like decl_indent but for locals */
 	bool lineup_to_parens_always;	/* whether to not(?) attempt to keep
 					 * lined-up code within the margin */
 	bool lineup_to_parens;	/* whether continued code within parens will be
 				 * lined up to the open paren */
 	bool proc_calls_space;	/* whether function calls look like: foo (bar)
 				 * rather than foo(bar) */
 	bool procnames_start_line;	/* whether the names of functions being
 					 * defined get placed in column 1 (i.e.
 					 * a newline is placed between the type
 					 * of the function and its name) */
 	bool space_after_cast;	/* "b = (int) a" vs. "b = (int)a" */
 	bool star_comment_cont;	/* whether comment continuation lines should
 				 * have stars at the beginning of each line */
 	bool swallow_optional_blank_lines;
 	bool auto_typedefs;	/* whether to recognize identifiers ending in
 				 * "_t" like typedefs */
 	int tabsize;		/* the size of a tab */
 	int max_line_length;
 	bool use_tabs;		/* set true to use tabs for spacing, false uses
 				 * all spaces */
 	bool verbose;		/* print configuration to stderr */
 } opt;
 extern bool found_err;
 extern bool had_eof;		/* whether input is exhausted */
 extern int line_no;		/* the current input line number */
 extern enum indent_enabled {
 	indent_on,
 	indent_off,
 	indent_last_off_line,
 } indent_enabled;
 #define	STACKSIZE 256
 /* Properties of each level of parentheses or brackets. */
 struct paren_level {
 	int indent;		/* indentation of the operand/argument,
 				 * relative to the enclosing statement; if
 				 * negative, reflected at -1 */
 	enum paren_level_cast {
 		cast_unknown,
 		cast_maybe,
 		cast_no,
 	} cast;			/* whether the parentheses form a type cast */
 };
 struct psym_stack {
 	int top;		/* pointer to top of stack */
 	parser_symbol sym[STACKSIZE];
 	int ind_level[STACKSIZE];
 };
 /*
  * The parser state determines the layout of the formatted text.
+ *
  * At each '#if', the parser state is copied so that the corresponding '#else'
  * lines start in the same state.
+ *
  * In a function body, the number of block braces determines the indentation
  * of statements and declarations.
+ *
  * In a statement, the number of parentheses or brackets determines the
  * indentation of follow-up lines.
+ *
  * In an expression, the token types determine whether to put spaces around.
+ *
  * In a source file, the types of line determine the vertical spacing, such as
  * around preprocessing directives or function bodies, or above block
  * comments.
  */
 extern struct parser_state {
 	lexer_symbol prev_lsym;	/* the previous token, but never comment,
 				 * newline or preprocessing line */
 	/* Token classification */
 	bool in_stmt_or_decl;	/* whether in a statement or a struct
 				 * declaration or a plain declaration */
 	bool in_decl;		/* XXX: double-check the exact meaning */
 	bool in_var_decl;	/* starts at a type name or a '){' from a
 				 * compound literal; ends at the '(' from a
 				 * function definition or a ';' outside '{}';
 				 * when active, '{}' form struct or union
 				 * declarations, ':' marks a bit-field, and '='
 				 * starts an initializer */
 	bool in_init;		/* whether inside an initializer */
 	int init_level;		/* the number of '{}' in an initializer */
 	bool line_has_func_def;	/* starts either at the 'name(' from a function
 				 * definition if it occurs at the beginning of
 				 * a line, or at the first '*' from inside a
 				 * declaration when the line starts with words
 				 * followed by a '(' */
 	bool in_func_def_params;	/* for old-style functions */
 	bool line_has_decl;	/* whether this line of code has part of a
 				 * declaration on it; used for indenting
 				 * comments */
 	parser_symbol lbrace_kind;	/* the kind of brace to be pushed to
 					 * the parser symbol stack next */
 	parser_symbol spaced_expr_psym;	/* the parser symbol to be shifted
 					 * after the parenthesized expression
 					 * from a 'for', 'if', 'switch' or
 					 * 'while'; or psym_0 */
 	bool seen_case;		/* whether there was a 'case' or 'default', to
 				 * properly space the following ':' */
 	bool prev_paren_was_cast;
 	int quest_level;	/* when this is positive, we have seen a '?'
 				 * without the matching ':' in a '?:'
 				 * expression */
 	/* Indentation of statements and declarations */
 	int ind_level;		/* the indentation level for the line that is
 				 * currently prepared for output */
 	int ind_level_follow;	/* the level to which ind_level should be set
 				 * after the current line is printed */
 	bool in_stmt_cont;	/* whether the current line should have an
 				 * extra indentation level because we are in
 				 * the middle of a statement */
 	int decl_level;		/* current nesting level for a structure
 				 * declaration or an initializer */
 	int di_stack[20];	/* a stack of structure indentation levels */
 	bool decl_indent_done;	/* whether the indentation for a declaration
 				 * has been added to the code buffer. */
 	int decl_ind;		/* current indentation for declarations */
 	bool tabs_to_var;	/* true if using tabs to indent to var name */
 	enum {
 		eei_no,
 		eei_maybe,
 		eei_last
 	} extra_expr_indent;
 	struct psym_stack psyms;
 	/* Spacing inside a statement or declaration */
 	bool next_unary;	/* whether the following operator should be
 				 * unary; is used in declarations for '*', as
 				 * well as in expressions */
 	bool want_blank;	/* whether the following token should be
 				 * prefixed by a blank. (Said prefixing is
 				 * ignored in some cases.) */
 	int ind_paren_level;	/* the number of parentheses or brackets that
 				 * is used for indenting a continuation line of
 				 * a declaration, initializer or statement */
 	int nparen;		/* the number of parentheses or brackets that
 				 * are currently open; used to indent the
 				 * remaining lines of the statement,
 				 * initializer or declaration */
 	struct paren_level paren[20];
 	/* Horizontal spacing for comments */
 	int comment_delta;	/* used to set up indentation for all lines of
 				 * a boxed comment after the first one */
 	int n_comment_delta;	/* remembers how many columns there were before
 				 * the start of a box comment so that
 				 * forthcoming lines of the comment are
 				 * indented properly */
 	int com_ind;		/* indentation of the current comment */
 	/* Vertical spacing */
 	bool break_after_comma;	/* whether to add a newline after the next
 				 * comma; used in declarations but not in
 				 * initializer lists */
 	bool force_nl;		/* whether the next token is forced to go to a
 				 * new line; used after 'if (expr)' and in
 				 * similar situations; tokens like '{' may
 				 * ignore this */
 	enum declaration {
 		decl_no,	/* no declaration anywhere nearby */
 		decl_begin,	/* collecting tokens of a declaration */
 		decl_end,	/* finished a declaration */
 	} declaration;
 	bool blank_line_after_decl;
 	/* Comments */
-	bool curr_col_1;	/* whether the current token started in column
-				 * 1 of the original input */
-	bool next_col_1;
+	bool next_col_1;	/* whether the next token starts in column 1 of
+				 * the original input */
 } ps;
 extern struct output_state {
 	enum line_kind {
 		lk_other,
 		lk_blank,
 		lk_if,		/* #if, #ifdef, #ifndef */
 		lk_endif,	/* #endif */
 		lk_stmt_head,	/* the ')' of an incomplete statement such as
 				 * 'if (expr)' or 'for (expr; expr; expr)' */
 		lk_func_end,	/* the last '}' of a function body */
 		lk_block_comment,
 		lk_case_or_default,
 	} line_kind;		/* kind of the line that is being prepared for
 				 * output; is reset to lk_other each time after
 				 * trying to send a line to the output, even if
 				 * that line was a suppressed blank line; used
 				 * for inserting or removing blank lines */
 	enum line_kind prev_line_kind;	/* the kind of line that was actually
 					 * sent to the output */
 	struct buffer indent_off_text;	/* text from between 'INDENT OFF' and
 					 * 'INDENT ON', both inclusive */
 } out;
 #define array_length(array) (sizeof(array) / sizeof((array)[0]))
 #ifdef debug
 void debug_printf(const char *, ...) __printflike(1, 2);
 void debug_println(const char *, ...) __printflike(1, 2);
 void debug_blank_line(void);
 void debug_vis_range(const char *, const char *, size_t, const char *);
 void debug_parser_state(void);
 void debug_psyms_stack(const char *);
 void debug_print_buf(const char *, const struct buffer *);
 void debug_buffers(void);
 extern const char *const lsym_name[];
 extern const char *const psym_name[];
 extern const char *const paren_level_cast_name[];
 extern const char *const line_kind_name[];
 #else
 #define debug_noop() do { } while (false)
 #define	debug_printf(fmt, ...) debug_noop()
 #define	debug_println(fmt, ...) debug_noop()
 #define debug_blank_line() debug_noop()
 #define	debug_vis_range(prefix, s, e, suffix) debug_noop()
 #define	debug_parser_state() debug_noop()
 #define	debug_psyms_stack(situation) debug_noop()
 #define debug_print_buf(name, buf) debug_noop()
 #define	debug_buffers() debug_noop()
 #endif
 void register_typename(const char *);
 int compute_code_indent(void);
 int compute_label_indent(void);
 int ind_add(int, const char *, size_t);
 void inp_skip(void);
 char inp_next(void);
 void finish_output(void);
 lexer_symbol lexi(void);
 void diag(int, const char *, ...) __printflike(2, 3);
 void output_line(void);
 void inp_read_line(void);
 void parse(parser_symbol);
 void process_comment(void);
 void set_option(const char *, const char *);
 void load_profile_files(const char *);
 void *nonnull(void *);
 void buf_add_char(struct buffer *, char);
 void buf_add_chars(struct buffer *, const char *, size_t);
 static inline bool
 ch_isalnum(char ch)
+{
 	return isalnum((unsigned char)ch) != 0;
+}
 static inline bool
 ch_isalpha(char ch)
+{
 	return isalpha((unsigned char)ch) != 0;
+}
 static inline bool
 ch_isblank(char ch)
+{
 	return ch == ' ' || ch == '\t';
+}
 static inline bool
 ch_isdigit(char ch)
+{
 	return '0' <= ch && ch <= '9';
+}
 static inline bool
 ch_isspace(char ch)
+{
 	return isspace((unsigned char)ch) != 0;
+}
 static inline int
 next_tab(int ind)
+{
 	return ind - ind % opt.tabsize + opt.tabsize;
+}
 #ifdef debug
 void buf_terminate(struct buffer *);
 #else
 #define buf_terminate(buf) debug_noop()
 #endif
 static inline void
 buf_clear(struct buffer *buf)
+{
 	buf->len = 0;
 	buf_terminate(buf);
+}

 @@ -1,687 +1,685 @@
-/*	$NetBSD: lexi.c,v 1.225 2023/06/10 16:43:56 rillig Exp $	*/
+/*	$NetBSD: lexi.c,v 1.226 2023/06/14 08:25:15 rillig Exp $	*/
 /*-
  * SPDX-License-Identifier: BSD-4-Clause
+ *
  * Copyright (c) 1985 Sun Microsystems, Inc.
  * Copyright (c) 1980, 1993
  *	The Regents of the University of California.  All rights reserved.
  * All rights reserved.
+ *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  * 3. All advertising materials mentioning features or use of this software
  *    must display the following acknowledgement:
  *	This product includes software developed by the University of
  *	California, Berkeley and its contributors.
  * 4. Neither the name of the University nor the names of its contributors
  *    may be used to endorse or promote products derived from this software
  *    without specific prior written permission.
+ *
  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 #include <sys/cdefs.h>
-__RCSID("$NetBSD: lexi.c,v 1.225 2023/06/10 16:43:56 rillig Exp $");
+__RCSID("$NetBSD: lexi.c,v 1.226 2023/06/14 08:25:15 rillig Exp $");
 #include <stdlib.h>
 #include <string.h>
 #include "indent.h"
 /* In lexi_alnum, this constant marks a type, independent of parentheses. */
 #define lsym_type lsym_type_outside_parentheses
 /* must be sorted alphabetically, is used in binary search */
 static const struct keyword {
 	const char name[12];
 	lexer_symbol lsym;
 } keywords[] = {
 	{"_Bool", lsym_type},
 	{"_Complex", lsym_type},
 	{"_Imaginary", lsym_type},
 	{"auto", lsym_modifier},
 	{"bool", lsym_type},
 	{"break", lsym_word},
 	{"case", lsym_case},
 	{"char", lsym_type},
 	{"complex", lsym_type},
 	{"const", lsym_modifier},
 	{"continue", lsym_word},
 	{"default", lsym_default},
 	{"do", lsym_do},
 	{"double", lsym_type},
 	{"else", lsym_else},
 	{"enum", lsym_tag},
 	{"extern", lsym_modifier},
 	{"float", lsym_type},
 	{"for", lsym_for},
 	{"goto", lsym_word},
 	{"if", lsym_if},
 	{"imaginary", lsym_type},
 	{"inline", lsym_modifier},
 	{"int", lsym_type},
 	{"long", lsym_type},
 	{"offsetof", lsym_offsetof},
 	{"register", lsym_modifier},
 	{"restrict", lsym_word},
 	{"return", lsym_return},
 	{"short", lsym_type},
 	{"signed", lsym_type},
 	{"sizeof", lsym_sizeof},
 	{"static", lsym_modifier},
 	{"struct", lsym_tag},
 	{"switch", lsym_switch},
 	{"typedef", lsym_typedef},
 	{"union", lsym_tag},
 	{"unsigned", lsym_type},
 	{"void", lsym_type},
 	{"volatile", lsym_modifier},
 	{"while", lsym_while}
 };
 static struct {
 	const char **items;
 	unsigned int len;
 	unsigned int cap;
 } typenames;
 /*-
  * The transition table below was rewritten by hand from lx's output, given
  * the following definitions. lx is Katherine Flavel's lexer generator.
+ *
  * O  = /[0-7]/;        D  = /[0-9]/;          NZ = /[1-9]/;
  * H  = /[a-f0-9]/i;    B  = /[0-1]/;          HP = /0x/i;
  * BP = /0b/i;          E  = /e[+\-]?/i D+;    P  = /p[+\-]?/i D+;
  * FS = /[fl]/i;        IS = /u/i /(l|L|ll|LL)/? | /(l|L|ll|LL)/ /u/i?;
+ *
  * D+           E  FS? -> $float;
  * D*    "." D+ E? FS? -> $float;
  * D+    "."    E? FS? -> $float;    HP H+           IS? -> $int;
  * HP H+        P  FS? -> $float;    NZ D*           IS? -> $int;
  * HP H* "." H+ P  FS? -> $float;    "0" O*          IS? -> $int;
  * HP H+ "."    P  FS  -> $float;    BP B+           IS? -> $int;
  */
 /* INDENT OFF */
 static const unsigned char lex_number_state[][26] = {
 	/*                examples:
 	         s                      0xx
 	         t                    00xaa
 	         a     11       101100xxa..
 	         r   11ee0001101lbuuxx.a.pp
 	         t.01.e+008bLuxll0Ll.aa.p+0
 	states:  ABCDEFGHIJKLMNOPQRSTUVWXYZ */
 	[0] =   "uuiifuufiuuiiuiiiiiuiuuuuu",	/* (other) */
 	[1] =   "CEIDEHHHIJQ  U  Q  VUVVZZZ",	/* 0 */
 	[2] =   "DEIDEHHHIJQ  U  Q  VUVVZZZ",	/* 1 */
 	[3] =   "DEIDEHHHIJ   U     VUVVZZZ",	/* 2 3 4 5 6 7 */
 	[4] =   "DEJDEHHHJJ   U     VUVVZZZ",	/* 8 9 */
 	[5] =   "             U     VUVV   ",	/* A a C c D d */
 	[6] =   "  K          U     VUVV   ",	/* B b */
 	[7] =   "  FFF   FF   U     VUVV   ",	/* E e */
 	[8] =   "    f  f     U     VUVV  f",	/* F f */
 	[9] =   "  LLf  fL  PR   Li  L    f",	/* L */
 	[10] =  "  OOf  fO   S P O i O    f",	/* l */
 	[11] =  "                    FFX   ",	/* P p */
 	[12] =  "  MM    M  i  iiM   M     ",	/* U u */
 	[13] =  "  N                       ",	/* X x */
 	[14] =  "     G                 Y  ",	/* + - */
 	[15] =  "B EE    EE   T      W     ",	/* . */
 	/*       ABCDEFGHIJKLMNOPQRSTUVWXYZ */
 };
 /* INDENT ON */
 static const unsigned char lex_number_row[] = {
 	['0'] = 1,
 	['1'] = 2,
 	['2'] = 3, ['3'] = 3, ['4'] = 3, ['5'] = 3, ['6'] = 3, ['7'] = 3,
 	['8'] = 4, ['9'] = 4,
 	['A'] = 5, ['a'] = 5, ['C'] = 5, ['c'] = 5, ['D'] = 5, ['d'] = 5,
 	['B'] = 6, ['b'] = 6,
 	['E'] = 7, ['e'] = 7,
 	['F'] = 8, ['f'] = 8,
 	['L'] = 9,
 	['l'] = 10,
 	['P'] = 11, ['p'] = 11,
 	['U'] = 12, ['u'] = 12,
 	['X'] = 13, ['x'] = 13,
 	['+'] = 14, ['-'] = 14,
 	['.'] = 15,
 };
 static bool
 is_identifier_start(char ch)
+{
 	return ch_isalpha(ch) || ch == '_' || ch == '$';
+}
 static bool
 is_identifier_part(char ch)
+{
 	return ch_isalnum(ch) || ch == '_' || ch == '$';
+}
 static void
 token_add_char(char ch)
+{
 	buf_add_char(&token, ch);
+}
 static void
 lex_number(void)
+{
 	for (unsigned char s = 'A'; s != 'f' && s != 'i' && s != 'u';) {
 		unsigned char ch = (unsigned char)inp_p[0];
 		if (ch == '\\' && inp_p[1] == '\n') {
 			inp_p++;
 			inp_skip();
 			line_no++;
 			continue;
+		}
 		if (ch >= array_length(lex_number_row)
 		    || lex_number_row[ch] == 0)
 			break;
 		unsigned char row = lex_number_row[ch];
 		if (lex_number_state[row][s - 'A'] == ' ') {
 			/*-
 		         * lex_number_state[0][s - 'A'] now indicates the type:
 		         * f = floating, i = integer, u = unknown
 		         */
 			return;
+		}
 		s = lex_number_state[row][s - 'A'];
 		token_add_char(inp_next());
+	}
+}
 static void
 lex_word(void)
+{
 	for (;;) {
 		if (is_identifier_part(inp_p[0]))
 			token_add_char(*inp_p++);
 		else if (inp_p[0] == '\\' && inp_p[1] == '\n') {
 			inp_p++;
 			inp_skip();
 			line_no++;
 		} else
 			return;
+	}
+}
 static void
 lex_char_or_string(void)
+{
 	for (char delim = token.s[token.len - 1];;) {
 		if (inp_p[0] == '\n') {
 			diag(1, "Unterminated literal");
 			return;
+		}
 		token_add_char(*inp_p++);
 		if (token.s[token.len - 1] == delim)
 			return;
 		if (token.s[token.len - 1] == '\\') {
 			if (inp_p[0] == '\n')
 				++line_no;
 			token_add_char(inp_next());
+		}
+	}
+}
 /* Guess whether the current token is a declared type. */
 static bool
 probably_typename(void)
+{
 	if (ps.prev_lsym == lsym_modifier)
 		return true;
 	if (ps.in_init)
 		return false;
 	if (ps.in_stmt_or_decl)	/* XXX: this condition looks incorrect */
 		return false;
 	if (ps.prev_lsym == lsym_semicolon
 	    || ps.prev_lsym == lsym_lbrace
 	    || ps.prev_lsym == lsym_rbrace) {
 		if (inp_p[0] == '*' && inp_p[1] != '=')
 			return true;
 		/* XXX: is_identifier_start */
 		if (ch_isalpha(inp_p[0]))
 			return true;
+	}
 	return false;
+}
 static int
 bsearch_typenames(const char *key)
+{
 	const char **arr = typenames.items;
 	unsigned lo = 0;
 	unsigned hi = typenames.len;
 	while (lo < hi) {
 		unsigned mid = (lo + hi) / 2;
 		int cmp = strcmp(arr[mid], key);
 		if (cmp < 0)
 			lo = mid + 1;
 		else if (cmp > 0)
 			hi = mid;
 		else
 			return (int)mid;
+	}
 	return -1 - (int)lo;
+}
 static bool
 is_typename(void)
+{
 	if (opt.auto_typedefs &&
 	    token.len >= 2 && memcmp(token.s + token.len - 2, "_t", 2) == 0)
 		return true;
 	return bsearch_typenames(token.s) >= 0;
+}
 void
 register_typename(const char *name)
+{
 	if (typenames.len >= typenames.cap) {
 		typenames.cap = 16 + 2 * typenames.cap;
 		typenames.items = nonnull(realloc(typenames.items,
 			sizeof(typenames.items[0]) * typenames.cap));
+	}
 	int pos = bsearch_typenames(name);
 	if (pos >= 0)
 		return;		/* already in the list */
 	pos = -1 - pos;
 	memmove(typenames.items + pos + 1, typenames.items + pos,
 	    sizeof(typenames.items[0]) * (typenames.len++ - (unsigned)pos));
 	typenames.items[pos] = nonnull(strdup(name));
+}
 static int
 cmp_keyword_by_name(const void *key, const void *elem)
+{
 	return strcmp(key, ((const struct keyword *)elem)->name);
+}
 /*
  * Looking at something like 'function_name(...)' in a line, guess whether
  * this starts a function definition or a declaration.
  */
 static bool
 probably_function_definition(void)
+{
 	int paren_level = 0;
 	for (const char *p = inp_p; *p != '\n'; p++) {
 		if (*p == '(')
 			paren_level++;
 		if (*p == ')' && --paren_level == 0) {
 			p++;
 			while (*p != '\n'
 			    && (ch_isspace(*p) || is_identifier_part(*p)))
 				p++;	/* '__dead' or '__unused' */
 			if (*p == '\n')	/* func(...) */
 				break;
 			if (*p == ';')	/* func(...); */
 				return false;
 			if (*p == ',')	/* double abs(), pi; */
 				return false;
 			if (*p == '(')	/* func(...) __attribute__((...)) */
 				paren_level++;	/* func(...) __printflike(...)
 						 */
 			else
 				break;	/* func(...) { ... */
+		}
 		if (paren_level == 1 && p[0] == '*' && p[1] == ',')
 			return false;
+	}
 	/* To further reduce the cases where indent wrongly treats an
 	 * incomplete function declaration as a function definition, thus
 	 * adding a newline before the function name, it may be worth looking
 	 * for parameter names, as these are often omitted in function
 	 * declarations and only included in function definitions. Or just
 	 * increase the lookahead to more than just the current line of input,
 	 * until the next '{'. */
 	return true;
+}
 static lexer_symbol
 lexi_alnum(void)
+{
 	if (ch_isdigit(inp_p[0]) ||
 	    (inp_p[0] == '.' && ch_isdigit(inp_p[1]))) {
 		lex_number();
 	} else if (is_identifier_start(inp_p[0])) {
 		lex_word();
 		if (token.len == 1 && token.s[0] == 'L' &&
 		    (inp_p[0] == '"' || inp_p[0] == '\'')) {
 			token_add_char(*inp_p++);
 			lex_char_or_string();
 			ps.next_unary = false;
 			return lsym_word;
+		}
 	} else
 		return lsym_eof;	/* just as a placeholder */
 	while (ch_isblank(inp_p[0]))
 		inp_p++;
 	ps.next_unary = ps.prev_lsym == lsym_tag
 	    || ps.prev_lsym == lsym_typedef;
 	if (ps.prev_lsym == lsym_tag && ps.nparen == 0)
 		return lsym_type_outside_parentheses;
 	token_add_char('\0');
 	token.len--;
 	const struct keyword *kw = bsearch(token.s, keywords,
 	    array_length(keywords), sizeof(keywords[0]), cmp_keyword_by_name);
 	lexer_symbol lsym = lsym_word;
 	if (kw != NULL) {
 		if (kw->lsym == lsym_type)
 			lsym = lsym_type_in_parentheses;
 		ps.next_unary = true;
 		if (kw->lsym == lsym_tag || kw->lsym == lsym_type)
 			goto found_typename;
 		return kw->lsym;
+	}
 	if (is_typename()) {
 		lsym = lsym_type_in_parentheses;
 		ps.next_unary = true;
 found_typename:
 		if (ps.nparen > 0) {
 			/* inside parentheses: cast, param list, offsetof or
 			 * sizeof */
 			if (ps.paren[ps.nparen - 1].cast == cast_unknown)
 				ps.paren[ps.nparen - 1].cast = cast_maybe;
+		}
 		if (ps.prev_lsym != lsym_period
 		    && ps.prev_lsym != lsym_unary_op) {
 			if (kw != NULL && kw->lsym == lsym_tag)
 				return lsym_tag;
 			if (ps.nparen == 0)
 				return lsym_type_outside_parentheses;
+		}
+	}
 	if (inp_p[0] == '(' && ps.psyms.top <= 1 && ps.ind_level == 0 &&
 	    !ps.in_func_def_params && !ps.in_init) {
 		if (ps.nparen == 0 && probably_function_definition()) {
 			ps.line_has_func_def = true;
 			if (ps.in_decl)
 				ps.in_func_def_params = true;
 			return lsym_funcname;
+		}
 	} else if (ps.nparen == 0 && probably_typename()) {
 		ps.next_unary = true;
 		return lsym_type_outside_parentheses;
+	}
 	return lsym;
+}
 static bool
 is_asterisk_pointer(void)
+{
 	if (inp_p[strspn(inp_p, "* \t")] == ')')
 		return true;
 	if (ps.next_unary || ps.in_func_def_params)
 		return true;
 	if (ps.prev_lsym == lsym_word ||
 	    ps.prev_lsym == lsym_rparen ||
 	    ps.prev_lsym == lsym_rbracket)
 		return false;
 	return ps.in_decl && ps.nparen > 0;
+}
 static bool
 probably_in_function_definition(void)
+{
 	for (const char *tp = inp_p; *tp != '\n';) {
 		if (ch_isspace(*tp))
 			tp++;
 		else if (is_identifier_start(*tp)) {
 			tp++;
 			while (is_identifier_part(*tp))
 				tp++;
 		} else
 			return *tp == '(';
+	}
 	return false;
+}
 static void
 lex_asterisk_pointer(void)
+{
 	while (inp_p[0] == '*' || ch_isspace(inp_p[0])) {
 		if (inp_p[0] == '*')
 			token_add_char('*');
 		inp_skip();
+	}
 	if (ps.in_decl && probably_in_function_definition())
 		ps.line_has_func_def = true;
+}
 static bool
 skip(const char **pp, const char *s)
+{
 	size_t len = strlen(s);
 	while (ch_isblank(**pp))
 		(*pp)++;
 	if (strncmp(*pp, s, len) == 0) {
 		*pp += len;
 		return true;
+	}
 	return false;
+}
 static void
 lex_indent_comment(void)
+{
 	const char *p = inp.s;
 	if (skip(&p, "/*") && skip(&p, "INDENT")) {
 		enum indent_enabled enabled;
 		if (skip(&p, "ON") || *p == '*')
 			enabled = indent_last_off_line;
 		else if (skip(&p, "OFF"))
 			enabled = indent_off;
 		else
 			return;
 		if (skip(&p, "*/\n")) {
 			if (lab.len > 0 || code.len > 0 || com.len > 0)
 				output_line();
 			indent_enabled = enabled;
+		}
+	}
+}
 /* Reads the next token, placing it in the global variable "token". */
 lexer_symbol
 lexi(void)
+{
 	buf_clear(&token);
-	ps.curr_col_1 = ps.next_col_1;
 	ps.next_col_1 = false;
 	for (;;) {
-		if (ch_isblank(inp_p[0])) {
-			ps.curr_col_1 = false;
+		if (ch_isblank(inp_p[0]))
 			inp_p++;
-		} else if (inp_p[0] == '\\' && inp_p[1] == '\n') {
+		else if (inp_p[0] == '\\' && inp_p[1] == '\n') {
 			inp_p++;
 			inp_skip();
 			line_no++;
 		} else
 			break;
+	}
 	lexer_symbol alnum_lsym = lexi_alnum();
 	if (alnum_lsym != lsym_eof)
 		return alnum_lsym;
 	/* Scan a non-alphanumeric token */
 	token_add_char(inp_next());
 	lexer_symbol lsym;
 	bool next_unary;
 	switch (token.s[token.len - 1]) {
 	case '#':
 		lsym = lsym_preprocessing;
 		next_unary = ps.next_unary;
 		break;
 	case '\n':
 		/* if data has been exhausted, the '\n' is a dummy. */
 		lsym = had_eof ? lsym_eof : lsym_newline;
 		next_unary = ps.next_unary;
 		ps.next_col_1 = true;
 		break;
 	/* INDENT OFF */
 	case '(':	lsym = lsym_lparen;	next_unary = true;	break;
 	case ')':	lsym = lsym_rparen;	next_unary = false;	break;
 	case '[':	lsym = lsym_lbracket;	next_unary = true;	break;
 	case ']':	lsym = lsym_rbracket;	next_unary = false;	break;
 	case '{':	lsym = lsym_lbrace;	next_unary = true;	break;
 	case '}':	lsym = lsym_rbrace;	next_unary = true;	break;
 	case '.':	lsym = lsym_period;	next_unary = false;	break;
 	case '?':	lsym = lsym_question;	next_unary = true;	break;
 	case ',':	lsym = lsym_comma;	next_unary = true;	break;
 	case ';':	lsym = lsym_semicolon;	next_unary = true;	break;
 	/* INDENT ON */
 	case '-':
 	case '+':
 		lsym = ps.next_unary ? lsym_unary_op : lsym_binary_op;
 		next_unary = true;
 		/* '++' or '--' */
 		if (inp_p[0] == token.s[token.len - 1]) {
 			token_add_char(*inp_p++);
 			if (ps.prev_lsym == lsym_word ||
 			    ps.prev_lsym == lsym_rparen ||
 			    ps.prev_lsym == lsym_rbracket) {
 				lsym = ps.next_unary
 				    ? lsym_unary_op : lsym_postfix_op;
 				next_unary = false;
+			}
 		} else if (inp_p[0] == '=') {	/* '+=' or '-=' */
 			token_add_char(*inp_p++);
 		} else if (inp_p[0] == '>') {	/* '->' */
 			token_add_char(*inp_p++);
 			lsym = lsym_unary_op;
 			next_unary = false;
 			ps.want_blank = false;
+		}
 		break;
 	case ':':
 		lsym = ps.quest_level > 0
 		    ? (ps.quest_level--, lsym_question_colon)
 		    : ps.in_var_decl ? lsym_other_colon : lsym_label_colon;
 		next_unary = true;
 		break;
 	case '*':
 		if (inp_p[0] == '=') {
 			token_add_char(*inp_p++);
 			lsym = lsym_binary_op;
 		} else if (is_asterisk_pointer()) {
 			lex_asterisk_pointer();
 			lsym = lsym_unary_op;
 		} else
 			lsym = lsym_binary_op;
 		next_unary = true;
 		break;
 	case '=':
 		if (ps.in_var_decl)
 			ps.in_init = true;
 		if (inp_p[0] == '=')
 			token_add_char(*inp_p++);
 		lsym = lsym_binary_op;
 		next_unary = true;
 		break;
 	case '>':
 	case '<':
 	case '!':		/* ops like <, <<, <=, !=, etc. */
 		if (inp_p[0] == '>' || inp_p[0] == '<' || inp_p[0] == '=')
 			token_add_char(*inp_p++);
 		if (inp_p[0] == '=')
 			token_add_char(*inp_p++);
 		lsym = ps.next_unary ? lsym_unary_op : lsym_binary_op;
 		next_unary = true;
 		break;
 	case '\'':
 	case '"':
 		lex_char_or_string();
 		lsym = lsym_word;
 		next_unary = false;
 		break;
 	default:
 		if (token.s[token.len - 1] == '/'
 		    && (inp_p[0] == '*' || inp_p[0] == '/')) {
 			enum indent_enabled prev = indent_enabled;
 			lex_indent_comment();
 			if (prev == indent_on && indent_enabled == indent_off)
 				buf_clear(&out.indent_off_text);
 			token_add_char(*inp_p++);
 			lsym = lsym_comment;
 			next_unary = ps.next_unary;
 			break;
+		}
 		/* punctuation like '%', '&&', '/', '^', '||', '~' */
 		lsym = ps.next_unary ? lsym_unary_op : lsym_binary_op;
 		if (inp_p[0] == token.s[token.len - 1])
 			token_add_char(*inp_p++), lsym = lsym_binary_op;
 		if (inp_p[0] == '=')
 			token_add_char(*inp_p++), lsym = lsym_binary_op;
 		next_unary = true;
+	}
 	ps.next_unary = next_unary;
 	return lsym;
+}

 @@ -1,357 +1,357 @@
-/*	$NetBSD: pr_comment.c,v 1.161 2023/06/10 16:43:56 rillig Exp $	*/
+/*	$NetBSD: pr_comment.c,v 1.162 2023/06/14 08:25:15 rillig Exp $	*/
 /*-
  * SPDX-License-Identifier: BSD-4-Clause
+ *
  * Copyright (c) 1985 Sun Microsystems, Inc.
  * Copyright (c) 1980, 1993
  *	The Regents of the University of California.  All rights reserved.
  * All rights reserved.
+ *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  * 3. All advertising materials mentioning features or use of this software
  *    must display the following acknowledgement:
  *	This product includes software developed by the University of
  *	California, Berkeley and its contributors.
  * 4. Neither the name of the University nor the names of its contributors
  *    may be used to endorse or promote products derived from this software
  *    without specific prior written permission.
+ *
  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 #include <sys/cdefs.h>
-__RCSID("$NetBSD: pr_comment.c,v 1.161 2023/06/10 16:43:56 rillig Exp $");
+__RCSID("$NetBSD: pr_comment.c,v 1.162 2023/06/14 08:25:15 rillig Exp $");
 #include <string.h>
 #include "indent.h"
 static void
 com_add_char(char ch)
+{
 	buf_add_char(&com, ch);
+}
 static void
 com_add_delim(void)
+{
 	if (opt.star_comment_cont)
 		buf_add_chars(&com, " * ", 3);
+}
 static bool
 fits_in_one_line(int com_ind, int max_line_length)
+{
 	for (const char *start = inp_p, *p = start; *p != '\n'; p++) {
 		if (p[0] == '*' && p[1] == '/') {
 			while (p - inp_p >= 2
 			    && ch_isblank(p[-1])
 			    && ch_isblank(p[-2]))
 				p--;
 			int len = ind_add(com_ind + 3,
 			    start, (size_t)(p - start));
 			len += p == start || ch_isblank(p[-1]) ? 2 : 3;
 			return len <= max_line_length;
+		}
+	}
 	return false;
+}
 static void
 analyze_comment(bool *p_may_wrap, bool *p_delim,
     int *p_ind, int *p_line_length)
+{
 	bool may_wrap = true;
 	bool delim = false;
 	int ind;
 	int line_length = opt.max_line_length;
-	if (ps.curr_col_1 && !opt.format_col1_comments) {
+	if (inp_p - inp.s == 2 && !opt.format_col1_comments) {
 		may_wrap = false;
 		ind = 0;
 	} else {
 		if (inp_p[0] == '-' || inp_p[0] == '*' ||
 		    token.s[token.len - 1] == '/' ||
 		    (inp_p[0] == '\n' && !opt.format_block_comments))
 			may_wrap = false;
 		if (code.len == 0 && inp_p[strspn(inp_p, "*")] == '\n')
 			out.line_kind = lk_block_comment;
 		if (com.len > 0)
 			output_line();
 		if (lab.len == 0 && code.len == 0) {
 			ind = (ps.ind_level - opt.unindent_displace)
 			    * opt.indent_size;
 			if (ind <= 0)
 				ind = opt.format_col1_comments ? 0 : 1;
 			line_length = opt.block_comment_max_line_length;
 			if (may_wrap && inp_p[0] == '\n')
 				delim = true;
 			if (may_wrap && opt.comment_delimiter_on_blank_line)
 				delim = true;
 		} else {
 			int target_ind = code.len > 0
 			    ? ind_add(compute_code_indent(), code.s, code.len)
 			    : ind_add(compute_label_indent(), lab.s, lab.len);
 			ind = ps.line_has_decl || ps.ind_level == 0
 			    ? opt.decl_comment_column - 1
 			    : opt.comment_column - 1;
 			if (ind <= target_ind)
 				ind = next_tab(target_ind);
 			if (ind + 25 > line_length)
 				line_length = ind + 25;
+		}
+	}
 	ps.com_ind = ind;
 	if (!may_wrap) {
 		/* Find out how much indentation there was originally, because
 		 * that much will have to be ignored by output_line. */
 		size_t len = (size_t)(inp_p - 2 - inp.s);
 		ps.n_comment_delta = -ind_add(0, inp.s, len);
 	} else {
 		ps.n_comment_delta = 0;
 		if (!(inp_p[0] == '\t' && !ch_isblank(inp_p[1])))
 			while (ch_isblank(inp_p[0]))
 				inp_p++;
+	}
 	*p_may_wrap = may_wrap;
 	*p_delim = delim;
 	*p_ind = ind;
 	*p_line_length = line_length;
+}
 static void
 copy_comment_start(bool may_wrap, bool *delim, int ind, int line_length)
+{
 	ps.comment_delta = 0;
 	com_add_char('/');
 	com_add_char(token.s[token.len - 1]);	/* either '*' or '/' */
 	if (may_wrap) {
 		if (!ch_isblank(inp_p[0]))
 			com_add_char(' ');
 		if (*delim && fits_in_one_line(ind, line_length))
 			*delim = false;
 		if (*delim) {
 			output_line();
 			com_add_delim();
+		}
+	}
+}
 static void
 copy_comment_wrap_text(int line_length, ssize_t *last_blank)
+{
 	int now_len = ind_add(ps.com_ind, com.s, com.len);
 	for (;;) {
 		char ch = inp_next();
 		if (ch_isblank(ch))
 			*last_blank = (ssize_t)com.len;
 		com_add_char(ch);
 		now_len++;
 		if (memchr("*\n\r\b\t", inp_p[0], 6) != NULL)
 			break;
 		if (now_len >= line_length && *last_blank != -1)
 			break;
+	}
 	ps.next_col_1 = false;
 	if (now_len <= line_length)
 		return;
 	if (ch_isspace(com.s[com.len - 1]))
 		return;
 	if (*last_blank == -1) {
 		/* only a single word in this line */
 		output_line();
 		com_add_delim();
 		return;
+	}
 	const char *last_word_s = com.s + *last_blank + 1;
 	size_t last_word_len = com.len - (size_t)(*last_blank + 1);
 	com.len = (size_t)*last_blank;
 	output_line();
 	com_add_delim();
 	/* Assume that output_line and com_add_delim don't invalidate the
 	 * "unused" part of the buffer beyond com.s + com.len. */
 	memmove(com.s + com.len, last_word_s, last_word_len);
 	com.len += last_word_len;
 	*last_blank = -1;
+}
 static bool
 copy_comment_wrap_newline(ssize_t *last_blank)
+{
 	*last_blank = -1;
 	if (ps.next_col_1) {
 		if (com.len == 0)
 			com_add_char(' ');	/* force empty output line */
 		if (com.len > 3) {
 			output_line();
 			com_add_delim();
+		}
 		output_line();
 		com_add_delim();
 	} else {
 		ps.next_col_1 = true;
 		if (!(com.len > 0 && ch_isblank(com.s[com.len - 1])))
 			com_add_char(' ');
 		*last_blank = (int)com.len - 1;
+	}
 	++line_no;
 	/* flush any blanks and/or tabs at start of next line */
 	inp_skip();		/* '\n' */
 	while (ch_isblank(inp_p[0]))
 		inp_p++;
 	if (inp_p[0] == '*' && inp_p[1] == '/')
 		return false;
 	if (inp_p[0] == '*') {
 		inp_p++;
 		while (ch_isblank(inp_p[0]))
 			inp_p++;
+	}
 	return true;
+}
 static void
 copy_comment_wrap_finish(int line_length, bool delim)
+{
 	if (delim) {
 		if (com.len > 3)
 			output_line();
 		else
 			buf_clear(&com);
 		com_add_char(' ');
 	} else {
 		size_t len = com.len;
 		while (ch_isblank(com.s[len - 1]))
 			len--;
 		int end_ind = ind_add(ps.com_ind, com.s, len);
 		if (end_ind + 3 > line_length)
 			output_line();
+	}
 	while (com.len >= 2
 	    && ch_isblank(com.s[com.len - 1])
 	    && ch_isblank(com.s[com.len - 2]))
 		com.len--;
 	buf_terminate(&com);
 	inp_p += 2;
 	if (com.len > 0 && ch_isblank(com.s[com.len - 1]))
 		buf_add_chars(&com, "*/", 2);
 	else
 		buf_add_chars(&com, " */", 3);
+}
 /*
  * Copy characters from 'inp' to 'com'. Try to keep comments from going over
  * the maximum line length. To do that, remember where the last blank, tab, or
  * newline was. When a line is filled, print up to the last blank and continue
  * copying.
  */
 static void
 copy_comment_wrap(int line_length, bool delim)
+{
 	ssize_t last_blank = -1;	/* index of the last blank in 'com' */
 	for (;;) {
 		if (inp_p[0] == '\n') {
 			if (had_eof)
 				goto unterminated_comment;
 			if (!copy_comment_wrap_newline(&last_blank))
 				goto end_of_comment;
 		} else if (inp_p[0] == '*' && inp_p[1] == '/')
 			goto end_of_comment;
 		else
 			copy_comment_wrap_text(line_length, &last_blank);
+	}
 end_of_comment:
 	copy_comment_wrap_finish(line_length, delim);
 	return;
 unterminated_comment:
 	diag(1, "Unterminated comment");
 	output_line();
+}
 static void
 copy_comment_nowrap(void)
+{
 	char kind = token.s[token.len - 1];
 	for (;;) {
 		if (inp_p[0] == '\n') {
 			if (kind == '/')
 				return;
 			if (had_eof) {
 				diag(1, "Unterminated comment");
 				output_line();
 				return;
+			}
 			if (com.len == 0)
 				com_add_char(' ');	/* force output of an
 							 * empty line */
 			output_line();
 			++line_no;
 			inp_skip();
 			continue;
+		}
 		com_add_char(*inp_p++);
 		if (com.len >= 2
 		    && com.s[com.len - 2] == '*'
 		    && com.s[com.len - 1] == '/'
 		    && kind == '*')
 			return;
+	}
+}
 /*
  * Scan, reformat and output a single comment, which is either a block comment
  * starting with '/' '*' or an end-of-line comment starting with '//'.
  */
 void
 process_comment(void)
+{
 	bool may_wrap, delim;
 	int ind, line_length;
 	analyze_comment(&may_wrap, &delim, &ind, &line_length);
 	copy_comment_start(may_wrap, &delim, ind, line_length);
 	if (may_wrap)
 		copy_comment_wrap(line_length, delim);
 	else
 		copy_comment_nowrap();
+}