Recent patches added indentation checks that discovered some cosmetic issues at the cost of making this check last as long as the rest of syntax-check combined on my system. Also, they're moving closer to us implementing yet another C parser (docs/apibuild.py being the other one). Revert the following commits: commit 11e1f11dd34f2688169c63c13ea8d99a64724369 syntax-check: Check for incorrect indentation in function body commit 2585a79e32e8b0d994ab35fd7c641eb9b96632e3 build-aux:check-spacing: Introduce a new rule to check misaligned stuff in parenthesises commit a033182f042a07ffbd4b9a50418670778ceddbf3 build-aux:check-spacing: Add wrapper function of CheckCurlyBrackets commit 6225626b6f0a4817d1f17de0bc5200c5d7986a3e build-aux:check-spacing: Add wrapper function of CheckWhiteSpaces commit c3875129d9bd094ffe90d54fbec86624ae88c40b build-aux:check-spacing: Add wrapper function of KillComments commit e995904c5691be3c21f4c6dbc1f067fe0c8e8515 build-aux:check-spacing: Add wrapper function of CheckFunctionBody commit 11e1f11dd34f2688169c63c13ea8d99a64724369 syntax-check: Check for incorrect indentation in function body This brings the speed of the script to a tolerable level and lets it focus on the more visible issues. Signed-off-by: Ján Tomko <jtomko@xxxxxxxxxx> --- build-aux/check-spacing.pl | 460 ++++++++++++++------------------------------- 1 file changed, 142 insertions(+), 318 deletions(-) diff --git a/build-aux/check-spacing.pl b/build-aux/check-spacing.pl index d36b004abf..ca8b434916 100755 --- a/build-aux/check-spacing.pl +++ b/build-aux/check-spacing.pl @@ -23,356 +23,180 @@ use strict; use warnings; -# -# CheckFunctionBody: -# $_[0]: $data(in) -# $_[1]: $location(in), which format is file-path:line-num:line-code -# $_[2]: $fn_linenum(inout), maintains start line-num of function body -# Returns 0 in case of success or 1 on failure -# -# Check incorrect indentation and blank first line in function body. -# For efficiency, it only checks the first line of function body. -# But it's enough for most cases. -# (It could be better that we use *state* to declare @fn_linenum and -# move it into this subroutine. But *state* requires version >= v5.10.) -# -sub CheckFunctionBody { - my $ret = 0; - my ($data, $location, $fn_linenum) = @_; +my $ret = 0; +my $incomment = 0; - # Check first line of function block - if ($$fn_linenum) { - if ($$data =~ /^\s*$/) { - print "Blank line before content in function body:\n$$location"; - $ret = 1; - } elsif ($$data !~ /^[ ]{4}\S/) { - unless ($$data =~ /^[ ]\w+:$/ || $$data =~ /^}/) { - print "Incorrect indentation in function body:\n$$location"; - $ret = 1; - } - } - $$fn_linenum = 0; - } +foreach my $file (@ARGV) { + # Per-file variables for multiline Curly Bracket (cb_) check + my $cb_linenum = 0; + my $cb_code = ""; + my $cb_scolon = 0; - # Detect start of function block - if ($$data =~ /^{$/) { - $$fn_linenum = $.; - } + open FILE, $file; - return $ret; -} + while (defined (my $line = <FILE>)) { + my $data = $line; + # For temporary modifications + my $tmpdata; -# -# KillComments: -# $_[0]: $data(inout) -# $_[1]: $incomment(inout) -# -# Remove all content of comments -# (Also, the @incomment could be declared with *state* and move it in.) -# -sub KillComments { - my ($data, $incomment) = @_; + # Kill any quoted , ; = or " + $data =~ s/'[";,=]'/'X'/g; - # Kill contents of multi-line comments - # and detect end of multi-line comments - if ($$incomment) { - if ($$data =~ m,\*/,) { - $$incomment = 0; - $$data =~ s,^.*\*/,*/,; - } else { - $$data = ""; - } - } + # Kill any quoted strings + $data =~ s,"(?:[^\\\"]|\\.)*","XXX",g; - # Kill single line comments, and detect - # start of multi-line comments - if ($$data =~ m,/\*.*\*/,) { - $$data =~ s,/\*.*\*/,/* */,; - } elsif ($$data =~ m,/\*,) { - $$incomment = 1; - $$data =~ s,/\*.*,/*,; - } + # Kill any C++ style comments + $data =~ s,//.*$,//,; - return; -} + next if $data =~ /^#/; -# -# CheckWhiteSpaces: -# $_[0]: $data(in) -# $_[1]: $location(in), which format is file-path:line-num:line-code -# Returns 0 in case of success or 1 on failure -# -# Check whitespaces according to code spec of libvirt. -# -sub CheckWhiteSpaces { - my $ret = 0; - my ($data, $location) = @_; + # Kill contents of multi-line comments + # and detect end of multi-line comments + if ($incomment) { + if ($data =~ m,\*/,) { + $incomment = 0; + $data =~ s,^.*\*/,*/,; + } else { + $data = ""; + } + } - # We need to match things like - # - # int foo (int bar, bool wizz); - # foo (bar, wizz); - # - # but not match things like: - # - # typedef int (*foo)(bar wizz) - # - # we can't do this (efficiently) without - # missing things like - # - # foo (*bar, wizz); - # - # We also don't want to spoil the $data so it can be used - # later on. + # Kill single line comments, and detect + # start of multi-line comments + if ($data =~ m,/\*.*\*/,) { + $data =~ s,/\*.*\*/,/* */,; + } elsif ($data =~ m,/\*,) { + $incomment = 1; + $data =~ s,/\*.*,/*,; + } - # For temporary modifications - my $tmpdata = $$data; - while ($tmpdata =~ /(\w+)\s\((?!\*)/) { - my $kw = $1; + # We need to match things like + # + # int foo (int bar, bool wizz); + # foo (bar, wizz); + # + # but not match things like: + # + # typedef int (*foo)(bar wizz) + # + # we can't do this (efficiently) without + # missing things like + # + # foo (*bar, wizz); + # + # We also don't want to spoil the $data so it can be used + # later on. + $tmpdata = $data; + while ($tmpdata =~ /(\w+)\s\((?!\*)/) { + my $kw = $1; + + # Allow space after keywords only + if ($kw =~ /^(?:if|for|while|switch|return)$/) { + $tmpdata =~ s/(?:$kw\s\()/XXX(/; + } else { + print "Whitespace after non-keyword:\n"; + print "$file:$.: $line"; + $ret = 1; + last; + } + } - # Allow space after keywords only - if ($kw =~ /^(?:if|for|while|switch|return)$/) { - $tmpdata =~ s/(?:$kw\s\()/XXX(/; - } else { - print "Whitespace after non-keyword:\n$$location"; + # Require whitespace immediately after keywords + if ($data =~ /\b(?:if|for|while|switch|return)\(/) { + print "No whitespace after keyword:\n"; + print "$file:$.: $line"; $ret = 1; - last; } - } - # Require whitespace immediately after keywords - if ($$data =~ /\b(?:if|for|while|switch|return)\(/) { - print "No whitespace after keyword:\n$$location"; - $ret = 1; - } - - # Forbid whitespace between )( of a function typedef - if ($$data =~ /\(\*\w+\)\s+\(/) { - print "Whitespace between ')' and '(':\n$$location"; - $ret = 1; - } - - # Forbid whitespace following ( or prior to ) - # but allow whitespace before ) on a single line - # (optionally followed by a semicolon) - if (($$data =~ /\s\)/ && not $$data =~ /^\s+\);?$/) || - $$data =~ /\((?!$)\s/) { - print "Whitespace after '(' or before ')':\n$$location"; - $ret = 1; - } - - # Forbid whitespace before ";" or ",". Things like below are allowed: - # - # 1) The expression is empty for "for" loop. E.g. - # for (i = 0; ; i++) - # - # 2) An empty statement. E.g. - # while (write(statuswrite, &status, 1) == -1 && - # errno == EINTR) - # ; - # - if ($$data =~ /\s[;,]/) { - unless ($$data =~ /\S; ; / || - $$data =~ /^\s+;/) { - print "Whitespace before semicolon or comma:\n$$location"; + # Forbid whitespace between )( of a function typedef + if ($data =~ /\(\*\w+\)\s+\(/) { + print "Whitespace between ')' and '(':\n"; + print "$file:$.: $line"; $ret = 1; } - } - - # Require EOL, macro line continuation, or whitespace after ";". - # Allow "for (;;)" as an exception. - if ($$data =~ /;[^ \\\n;)]/) { - print "Invalid character after semicolon:\n$$location"; - $ret = 1; - } - - # Require EOL, space, or enum/struct end after comma. - if ($$data =~ /,[^ \\\n)}]/) { - print "Invalid character after comma:\n$$location"; - $ret = 1; - } - - # Require spaces around assignment '=', compounds and '==' - if ($$data =~ /[^ ]\b[!<>&|\-+*\/%\^=]?=/ || - $$data =~ /=[^= \\\n]/) { - print "Spacing around '=' or '==':\n$$location"; - $ret = 1; - } - - return $ret; -} -# -# CheckCurlyBrackets: -# $_[0]: $data(in) -# $_[1]: $file(in) -# $_[2]: $line(in) -# $_[3]: $cb_linenum(inout) -# $_[4]: $cb_code(inout) -# $_[5]: $cb_scolon(inout) -# Returns 0 in case of success or 1 on failure -# -# Check whitespaces according to code spec of libvirt. -# -sub CheckCurlyBrackets { - my $ret = 0; - my ($data, $file, $line, $cb_linenum, $cb_code, $cb_scolon) = @_; - - # One line conditional statements with one line bodies should - # not use curly brackets. - if ($$data =~ /^\s*(if|while|for)\b.*\{$/) { - $$cb_linenum = $.; - $$cb_code = $$line; - $$cb_scolon = 0; - } - - # We need to check for exactly one semicolon inside the body, - # because empty statements (e.g. with comment only) are - # allowed - if ($$cb_linenum == $. - 1 && $$data =~ /^[^;]*;[^;]*$/) { - $$cb_code .= $$line; - $$cb_scolon = 1; - } - - if ($$data =~ /^\s*}\s*$/ && - $$cb_linenum == $. - 2 && - $$cb_scolon) { - - print "Curly brackets around single-line body:\n"; - print "$$file:$$cb_linenum-$.:\n$$cb_code$$line"; - $ret = 1; - - # There _should_ be no need to reset the values; but to - # keep my inner peace... - $$cb_linenum = 0; - $$cb_scolon = 0; - $$cb_code = ""; - } - - return $ret; -} - -# -# CheckMisalignment: -# $_[0]: $data(in) -# $_[1]: $file(in) -# $_[2]: $line(in) -# $_[3]: @paren_stack(inout), which maintains information -# of the parenthesis -# Returns 0 in case of success or 1 on failure -# -# Check misaligned stuff in parenthesis: -# 1. For misaligned arguments of function -# 2. For misaligned conditions of [if|while|switch|...] -# -sub CheckMisalignment { - my $ret = 0; - my ($data, $file, $line, $paren_stack) = @_; - - # Check alignment based on @paren_stack - if (@$paren_stack) { - if ($$data =~ /(\S+.*$)/) { - my $pos = $$paren_stack[-1][0]; - my $linenum = $$paren_stack[-1][1]; - my $code = $$paren_stack[-1][2]; - if ($pos + 1 != length($`)) { - my $pad = ""; - if ($. > $linenum + 1) { - $pad = " " x $pos . " ...\n"; - } - print "Misaligned line in parenthesis:\n"; - print "$$file:$linenum-$.:\n$code$pad$$line\n"; - $ret = 1; - } + # Forbid whitespace following ( or prior to ) + # but allow whitespace before ) on a single line + # (optionally followed by a semicolon) + if (($data =~ /\s\)/ && not $data =~ /^\s+\);?$/) || + $data =~ /\((?!$)\s/) { + print "Whitespace after '(' or before ')':\n"; + print "$file:$.: $line"; + $ret = 1; } - } - # Maintain @paren_stack - if ($$data =~ /.*[()]/) { - my $pos = 0; - my $temp = $$data; - - # Kill the content between matched parenthesis and themselves - # within the current line. - $temp =~ s,(\((?:[^()]++|(?R))*+\)),"X" x (length $&),ge; - - # Pop a item for the open-paren when finding close-paren - while (($pos = index($temp, "\)", $pos)) >= 0) { - if (@$paren_stack) { - pop(@$paren_stack); - $pos++; - } else { - print "Warning: found unbalanced parenthesis:\n"; - print "$$file:$.:\n$$line\n"; + # Forbid whitespace before ";" or ",". Things like below are allowed: + # + # 1) The expression is empty for "for" loop. E.g. + # for (i = 0; ; i++) + # + # 2) An empty statement. E.g. + # while (write(statuswrite, &status, 1) == -1 && + # errno == EINTR) + # ; + # + if ($data =~ /\s[;,]/) { + unless ($data =~ /\S; ; / || + $data =~ /^\s+;/) { + print "Whitespace before semicolon or comma:\n"; + print "$file:$.: $line"; $ret = 1; - last; } } - # Push the item for open-paren on @paren_stack - # @item = [ position of the open-paren, linenum, code-line ] - while (($pos = index($temp, "\(", $pos)) >= 0) { - push @$paren_stack, [$pos, $., $$line]; - $pos++; + # Require EOL, macro line continuation, or whitespace after ";". + # Allow "for (;;)" as an exception. + if ($data =~ /;[^ \\\n;)]/) { + print "Invalid character after semicolon:\n"; + print "$file:$.: $line"; + $ret = 1; } - } - return $ret; -} - -my $ret = 0; - -foreach my $file (@ARGV) { - # Per-file variables for multiline Curly Bracket (cb_) check - my $cb_linenum = 0; - my $cb_code = ""; - my $cb_scolon = 0; - my $fn_linenum = 0; - my $incomment = 0; - my @paren_stack; - - open FILE, $file; - - while (defined (my $line = <FILE>)) { - my $has_define = 0; - my $data = $line; - my $location = "$file:$.:\n$line"; - - # Kill any quoted , ; = or " - $data =~ s/'[";,=]'/'X'/g; - - # Kill any quoted strings. Replace with equal-length "XXXX..." - $data =~ s,"(([^\\\"]|\\.)*)","\"".'X'x(length $1)."\"",ge; - $data =~ s,'(([^\\\']|\\.)*)',"\'".'X'x(length $1)."\'",ge; + # Require EOL, space, or enum/struct end after comma. + if ($data =~ /,[^ \\\n)}]/) { + print "Invalid character after comma:\n"; + print "$file:$.: $line"; + $ret = 1; + } - # Kill any C++ style comments - $data =~ s,//.*$,//,; + # Require spaces around assignment '=', compounds and '==' + if ($data =~ /[^ ]\b[!<>&|\-+*\/%\^=]?=/ || + $data =~ /=[^= \\\n]/) { + print "Spacing around '=' or '==':\n"; + print "$file:$.: $line"; + $ret = 1; + } - $has_define = 1 if $data =~ /(?:^#\s*define\b)/; - if (not $has_define) { - # Ignore all macros except for #define - next if $data =~ /^#/; + # One line conditional statements with one line bodies should + # not use curly brackets. + if ($data =~ /^\s*(if|while|for)\b.*\{$/) { + $cb_linenum = $.; + $cb_code = $line; + $cb_scolon = 0; + } - $ret = 1 if CheckFunctionBody(\$data, \$location, \$fn_linenum); + # We need to check for exactly one semicolon inside the body, + # because empty statements (e.g. with comment only) are + # allowed + if ($cb_linenum == $. - 1 && $data =~ /^[^;]*;[^;]*$/) { + $cb_code .= $line; + $cb_scolon = 1; + } - KillComments(\$data, \$incomment); + if ($data =~ /^\s*}\s*$/ && + $cb_linenum == $. - 2 && + $cb_scolon) { - $ret = 1 if CheckWhiteSpaces(\$data, \$location); + print "Curly brackets around single-line body:\n"; + print "$file:$cb_linenum-$.:\n$cb_code$line"; + $ret = 1; - $ret = 1 if CheckCurlyBrackets(\$data, \$file, \$line, - \$cb_linenum, \$cb_code, \$cb_scolon); + # There _should_ be no need to reset the values; but to + # keep my inner peace... + $cb_linenum = 0; + $cb_scolon = 0; + $cb_code = ""; } - - ##################################################################### - # Temporary Filter for CheckMisalignment: - # Here we introduce a white-list of path, since there're - # too much misalignment. - # We _need_ fix these misalignment in batches. - # We _should_ remove it as soon as fixing all. - ##################################################################### - next unless $file =~ /^src\/util\//; - - $ret = 1 if CheckMisalignment(\$data, \$file, \$line, \@paren_stack); } close FILE; } -- 2.16.4 -- libvir-list mailing list libvir-list@xxxxxxxxxx https://www.redhat.com/mailman/listinfo/libvir-list