From: Steve Hancock <perltidy@users.sourceforge.net>
Date: Tue, 16 Aug 2022 03:23:16 +0000 (-0700)
Subject: add continuation indentation to C-style 'for' terms
X-Git-Tag: 20220613.05~50
X-Git-Url: https://git.donarmstrong.com/?a=commitdiff_plain;h=47b24771cd9ac201ee8d710234b07070555391ae;p=perltidy.git

add continuation indentation to C-style 'for' terms
---

diff --git a/CHANGES.md b/CHANGES.md
index bc61bdd7..e400c4fe 100644
--- a/CHANGES.md
+++ b/CHANGES.md
@@ -42,6 +42,26 @@
       # perltidy -drc:
             ignoreSpec( $file, "file", \%spec, \%Rspec );
 
+    - Add continuation indentation to long C-style 'for' terms; i.e.
+
+            # OLD
+            for (
+                $j = $i - $shell ;
+                $j >= 0
+                && ++$ncomp
+                && $array->[$j] gt $array->[ $j + $shell ] ;
+                $j -= $shell
+              )
+
+            # NEW
+            for (
+                $j = $i - $shell ;
+                $j >= 0
+                  && ++$ncomp
+                  && $array->[$j] gt $array->[ $j + $shell ] ;
+                $j -= $shell
+              )
+
     - Fixed an inconsistency in html colors near pointers when -html is used.
       Previously, a '->' at the end of a line got the 'punctuation color', black
       by default but a '->' before an identifier got the color of the following
diff --git a/lib/Perl/Tidy/Formatter.pm b/lib/Perl/Tidy/Formatter.pm
index 25ab6d00..d88fd802 100644
--- a/lib/Perl/Tidy/Formatter.pm
+++ b/lib/Perl/Tidy/Formatter.pm
@@ -519,7 +519,7 @@ BEGIN {
         _rix_seqno_controlling_ci_   => $i++,
         _batch_CODE_type_            => $i++,
         _ri_starting_one_line_block_ => $i++,
-        _has_unmatched_opening_      => $i++,
+        _runmatched_opening_indexes_ => $i++,
     };
 }
 
@@ -6197,11 +6197,6 @@ my $Klast_old;
 my $Klast_old_code;
 my $CODE_type;
 
-##Possible closure variables:
-##my $Kfirst;
-##my $Klast;
-##my $input_line_number;
-
 my $rwhitespace_flags;
 
 sub initialize_respace_tokens_closure {
@@ -6233,6 +6228,7 @@ sub initialize_respace_tokens_closure {
     $roverride_cab3            = $self->[_roverride_cab3_];
     $rparent_of_seqno          = $self->[_rparent_of_seqno_];
     $rtype_count_by_seqno      = $self->[_rtype_count_by_seqno_];
+    $rblock_type_of_seqno      = $self->[_rblock_type_of_seqno_];
 
     # Note that $K_opening_container and $K_closing_container have values
     # defined in sub get_line() for the previous K indexes.  They were needed
@@ -6244,8 +6240,6 @@ sub initialize_respace_tokens_closure {
 
     %K_first_here_doc_by_seqno = ();
 
-    $rblock_type_of_seqno = $self->[_rblock_type_of_seqno_];
-
     $last_nonblank_code_type       = ';';
     $last_nonblank_code_token      = ';';
     $last_nonblank_block_type      = EMPTY_STRING;
@@ -6266,11 +6260,6 @@ sub initialize_respace_tokens_closure {
     $Klast_old_code = undef;          # K of last token if side comment
     $CODE_type      = EMPTY_STRING;
 
-    ##possible closure variables:
-    ##$Kfirst         = undef;
-    ##$Klast          = undef;
-    ##$input_line_number = undef;
-
     # Set the whitespace flags, which indicate the token spacing preference.
     $rwhitespace_flags = $self->set_whitespace_flags();
 
@@ -6825,6 +6814,7 @@ sub respace_post_loop_ops {
     }
 
     # Find and remember lists by sequence number
+    my %is_C_style_for;
     foreach my $seqno ( keys %{$K_opening_container} ) {
         my $K_opening = $K_opening_container->{$seqno};
         next unless defined($K_opening);
@@ -6844,7 +6834,11 @@ sub respace_post_loop_ops {
         if ($rtype_count) {
             my $comma_count     = $rtype_count->{','};
             my $fat_comma_count = $rtype_count->{'=>'};
-            my $semicolon_count = $rtype_count->{';'} || $rtype_count->{'f'};
+            my $semicolon_count = $rtype_count->{';'};
+            if ( $rtype_count->{'f'} ) {
+                $semicolon_count += $rtype_count->{'f'};
+                $is_C_style_for{$seqno} = 1;
+            }
 
             # We will define a list to be a container with one or more commas
             # and no semicolons. Note that we have included the semicolons
@@ -7006,6 +7000,20 @@ sub respace_post_loop_ops {
             }
         }
     }
+
+    # Add -ci to C-style for loops (issue c154)
+    # This is much easier to do here than in the tokenizer.
+    foreach my $seqno ( keys %is_C_style_for ) {
+        my $K_opening = $K_opening_container->{$seqno};
+        my $K_closing = $K_closing_container->{$seqno};
+        my $type_last = 'f';
+        for my $KK ( $K_opening + 1 .. $K_closing - 1 ) {
+            $rLL_new->[$KK]->[_CI_LEVEL_] = $type_last eq 'f' ? 0 : 1;
+            my $type = $rLL_new->[$KK]->[_TYPE_];
+            if ( $type ne 'b' && $type ne '#' ) { $type_last = $type }
+        }
+    }
+
     return;
 } ## end sub respace_post_loop_ops
 
@@ -14551,9 +14559,8 @@ EOM
     my $peak_batch_size;
     my $batch_count;
 
-    # variables to keep track of unbalanced containers.
+    # variables to keep track of indentation of unmatched containers.
     my %saved_opening_indentation;
-    my @unmatched_opening_indexes_in_this_batch;
 
     sub initialize_grind_batch_of_CODE {
         @nonblank_lines_at_depth   = ();
@@ -14706,9 +14713,7 @@ EOM
         # Normal route
         #-------------
 
-        my $rLL                      = $self->[_rLL_];
-        my $ris_seqno_controlling_ci = $self->[_ris_seqno_controlling_ci_];
-        my $rwant_container_open     = $self->[_rwant_container_open_];
+        my $rLL = $self->[_rLL_];
 
         #-------------------------------------------------------
         # Loop over the batch to initialize some batch variables
@@ -14720,9 +14725,9 @@ EOM
         my %comma_arrow_count;
         my $comma_arrow_count_contained = 0;
         my @unmatched_closing_indexes_in_this_batch;
+        my @unmatched_opening_indexes_in_this_batch;
 
-        @unmatched_opening_indexes_in_this_batch = ();
-
+        my @i_for_semicolon;
         foreach my $i ( 0 .. $max_index_to_go ) {
             $iprev_to_go[$i] = $ilast_nonblank;
             $inext_to_go[$i] = $i + 1;
@@ -14742,12 +14747,12 @@ EOM
 
                 # remember indexes of any tokens controlling xci
                 # in this batch. This list is needed by sub undo_ci.
-                if ( $ris_seqno_controlling_ci->{$seqno} ) {
+                if ( $self->[_ris_seqno_controlling_ci_]->{$seqno} ) {
                     push @ix_seqno_controlling_ci, $i;
                 }
 
                 if ( $is_opening_sequence_token{$token} ) {
-                    if ( $rwant_container_open->{$seqno} ) {
+                    if ( $self->[_rwant_container_open_]->{$seqno} ) {
                         $self->set_forced_breakpoint($i);
                     }
                     push @unmatched_opening_indexes_in_this_batch, $i;
@@ -14757,7 +14762,7 @@ EOM
                 }
                 elsif ( $is_closing_sequence_token{$token} ) {
 
-                    if ( $i > 0 && $rwant_container_open->{$seqno} ) {
+                    if ( $i > 0 && $self->[_rwant_container_open_]->{$seqno} ) {
                         $self->set_forced_breakpoint( $i - 1 );
                     }
 
@@ -14795,13 +14800,28 @@ EOM
                     $comma_arrow_count{$seqno}++;
                 }
             }
+            elsif ( $type eq 'f' ) {
+                push @i_for_semicolon, $i;
+            }
+
         } ## end for ( my $i = 0 ; $i <=...)
 
+        # Break at a single interior C-style for semicolon in this batch (c154)
+        if ( @i_for_semicolon == 1 ) {
+            my $i     = $i_for_semicolon[0];
+            my $inext = $inext_to_go[$i];
+            if ( $inext <= $max_index_to_go && $types_to_go[$inext] ne '#' ) {
+                $self->set_forced_breakpoint($i);
+            }
+        }
+
         my $is_unbalanced_batch = @unmatched_opening_indexes_in_this_batch +
           @unmatched_closing_indexes_in_this_batch;
 
-        $this_batch->[_has_unmatched_opening_] =
-          @unmatched_opening_indexes_in_this_batch;
+        if (@unmatched_opening_indexes_in_this_batch) {
+            $this_batch->[_runmatched_opening_indexes_] =
+              \@unmatched_opening_indexes_in_this_batch;
+        }
 
         #------------------------
         # Set special breakpoints
@@ -15183,7 +15203,12 @@ EOM
         # saves indentations of lines of all unmatched opening tokens.
         # These will be used by sub get_opening_indentation.
 
-        my ( $self, $ri_first, $ri_last, $rindentation_list ) = @_;
+        my ( $self, $ri_first, $ri_last, $rindentation_list,
+            $runmatched_opening_indexes )
+          = @_;
+
+        $runmatched_opening_indexes = []
+          if ( !defined($runmatched_opening_indexes) );
 
         # QW INDENTATION PATCH 1:
         # Also save indentation for multiline qw quotes
@@ -15200,7 +15225,7 @@ EOM
 
         # we need to save indentations of any unmatched opening tokens
         # in this batch because we may need them in a subsequent batch.
-        foreach ( @unmatched_opening_indexes_in_this_batch, @i_qw ) {
+        foreach ( @{$runmatched_opening_indexes}, @i_qw ) {
 
             my $seqno = $type_sequence_to_go[$_];
 
@@ -18879,6 +18904,7 @@ EOM
         %quick_filter = %is_assignment;
         @q            = qw# => . ; < > ~ #;
         push @q, ',';
+        push @q, 'f';    # added for ';' for issue c154
         @quick_filter{@q} = (1) x scalar(@q);
     }
 
@@ -19245,12 +19271,15 @@ EOM
             # not a list.  Note that '=' could be in any of the = operators
             # (lextest.t). We can't just use the reported environment
             # because it can be incorrect in some cases.
-            elsif ( ( $type =~ /^[\;\<\>\~]$/ || $is_assignment{$type} )
+            elsif ( ( $type =~ /^[\;\<\>\~f]$/ || $is_assignment{$type} )
                 && !$self->is_in_list_by_i($i) )
             {
                 $dont_align[$depth]         = 1;
                 $want_comma_break[$depth]   = 0;
                 $index_before_arrow[$depth] = -1;
+
+                # no special comma breaks in C-style 'for' terms (c154)
+                if ( $type eq 'f' ) { $last_comma_index[$depth] = undef }
             }
 
             # now just handle any commas
@@ -19922,12 +19951,13 @@ EOM
             }
         }
 
+        # break long terms at any C-style for semicolons (c154)
         if ( $is_long_term
             && @{ $rfor_semicolon_list[$current_depth] } )
         {
             $self->set_for_semicolon_breakpoints($current_depth);
 
-            # open up a long 'for' or 'foreach' container to allow
+            # and open up a long 'for' or 'foreach' container to allow
             # leading term alignment unless -lp is used.
             $has_comma_breakpoints = 1 unless ($lp_object);
         }
@@ -23004,8 +23034,9 @@ EOM
 
     # remember indentation of lines containing opening containers for
     # later use by sub final_indentation_adjustment
-    $self->save_opening_indentation( $ri_first, $ri_last, $rindentation_list )
-      if ( $this_batch->[_has_unmatched_opening_]
+    $self->save_opening_indentation( $ri_first, $ri_last, $rindentation_list,
+        $this_batch->[_runmatched_opening_indexes_] )
+      if ( $this_batch->[_runmatched_opening_indexes_]
         || $types_to_go[$max_index_to_go] eq 'q' );
 
     # output any new -cscw block comment
@@ -23990,9 +24021,6 @@ sub get_seqno {
                         $ok_comma = $tok_next_next eq $tok_next;
                     }
 
-                    # no padding of C-style 'for' terms ('f' is ';' c154)
-                    next if ( $types_to_go[$iendm] eq 'f' );
-
                     next
                       unless (
                            $is_assignment{ $types_to_go[$iendm] }
diff --git a/t/snippets/c154.in b/t/snippets/c154.in
new file mode 100644
index 00000000..d532a9eb
--- /dev/null
+++ b/t/snippets/c154.in
@@ -0,0 +1,38 @@
+{{{{
+for (
+    $order =
+    $start_order * $nbSubOrderByOrder + $start_suborder ;
+    !exists $level_hash{$level}->{$order}
+    and $order <=
+    $stop_order * $nbSubOrderByOrder + $stop_suborder ;
+    $order++
+  )
+{
+}
+
+# has comma
+for (
+    $q = 201 ;
+    print '-' x 79,
+    "\n" ;
+    $g = (
+	$f ^ ( $w = ( $z = $m . $e ) ^ substr $e, $q )
+	  ^ ( $n = $b ^ $d | $a ^ $l )
+    ) & ( $w | $z ^ $f ^ $n ) & ( $l | $g )
+  )
+{
+    ...;
+}
+
+for (
+    $j = 0, $match_j = -1 ;
+    $j < $sub_len
+      &&
+
+      # changed from naive_string_matcher
+      $sub->[$j] eq $big->[ $i + $j ] ; $j++
+  )
+{
+    ...;
+}
+}}}}
diff --git a/t/snippets/expect/c154.def b/t/snippets/expect/c154.def
new file mode 100644
index 00000000..238900d5
--- /dev/null
+++ b/t/snippets/expect/c154.def
@@ -0,0 +1,44 @@
+{
+    {
+        {
+            {
+                for (
+                    $order =
+                      $start_order * $nbSubOrderByOrder + $start_suborder ;
+                    !exists $level_hash{$level}->{$order}
+                      and $order <=
+                      $stop_order * $nbSubOrderByOrder + $stop_suborder ;
+                    $order++
+                  )
+                {
+                }
+
+                # has comma
+                for (
+                    $q = 201 ;
+                    print '-' x 79, "\n" ;
+                    $g = (
+                          $f ^ ( $w = ( $z = $m . $e ) ^ substr $e, $q )
+                          ^ ( $n = $b ^ $d | $a ^ $l )
+                    ) & ( $w | $z ^ $f ^ $n ) & ( $l | $g )
+                  )
+                {
+                    ...;
+                }
+
+                for (
+                    $j = 0, $match_j = -1 ;
+                    $j < $sub_len
+                      &&
+
+                      # changed from naive_string_matcher
+                      $sub->[$j] eq $big->[ $i + $j ] ;
+                    $j++
+                  )
+                {
+                    ...;
+                }
+            }
+        }
+    }
+}
diff --git a/t/snippets/packing_list.txt b/t/snippets/packing_list.txt
index 17cc5a2c..a88b7d6f 100644
--- a/t/snippets/packing_list.txt
+++ b/t/snippets/packing_list.txt
@@ -357,6 +357,8 @@
 ../snippets26.t	drc.def
 ../snippets26.t	drc.drc
 ../snippets26.t	git105.def
+../snippets26.t	git106.def
+../snippets26.t	git106.git106
 ../snippets3.t	ce_wn1.ce_wn
 ../snippets3.t	ce_wn1.def
 ../snippets3.t	colin.colin
@@ -497,5 +499,4 @@
 ../snippets9.t	rt98902.def
 ../snippets9.t	rt98902.rt98902
 ../snippets9.t	rt99961.def
-../snippets26.t	git106.def
-../snippets26.t	git106.git106
+../snippets26.t	c154.def
diff --git a/t/snippets26.t b/t/snippets26.t
index ea51de6a..8b4c563b 100644
--- a/t/snippets26.t
+++ b/t/snippets26.t
@@ -14,6 +14,7 @@
 #11 git105.def
 #12 git106.def
 #13 git106.git106
+#14 c154.def
 
 # To locate test #13 you can search for its name or the string '#13'
 
@@ -102,6 +103,47 @@ _
 $r = $c->         
 
 sql_set_env_attr( $evh, $SQL_ATTR_ODBC_VERSION, $SQL_OV_ODBC2, 0 );
+----------
+
+        'c154' => <<'----------',
+{{{{
+for (
+    $order =
+    $start_order * $nbSubOrderByOrder + $start_suborder ;
+    !exists $level_hash{$level}->{$order}
+    and $order <=
+    $stop_order * $nbSubOrderByOrder + $stop_suborder ;
+    $order++
+  )
+{
+}
+
+# has comma
+for (
+    $q = 201 ;
+    print '-' x 79,
+    "\n" ;
+    $g = (
+	$f ^ ( $w = ( $z = $m . $e ) ^ substr $e, $q )
+	  ^ ( $n = $b ^ $d | $a ^ $l )
+    ) & ( $w | $z ^ $f ^ $n ) & ( $l | $g )
+  )
+{
+    ...;
+}
+
+for (
+    $j = 0, $match_j = -1 ;
+    $j < $sub_len
+      &&
+
+      # changed from naive_string_matcher
+      $sub->[$j] eq $big->[ $i + $j ] ; $j++
+  )
+{
+    ...;
+}
+}}}}
 ----------
 
         'drc' => <<'----------',
@@ -620,6 +662,57 @@ abcdefghijklmnopq
 }
 #13...........
         },
+
+        'c154.def' => {
+            source => "c154",
+            params => "def",
+            expect => <<'#14...........',
+{
+    {
+        {
+            {
+                for (
+                    $order =
+                      $start_order * $nbSubOrderByOrder + $start_suborder ;
+                    !exists $level_hash{$level}->{$order}
+                      and $order <=
+                      $stop_order * $nbSubOrderByOrder + $stop_suborder ;
+                    $order++
+                  )
+                {
+                }
+
+                # has comma
+                for (
+                    $q = 201 ;
+                    print '-' x 79, "\n" ;
+                    $g = (
+                          $f ^ ( $w = ( $z = $m . $e ) ^ substr $e, $q )
+                          ^ ( $n = $b ^ $d | $a ^ $l )
+                    ) & ( $w | $z ^ $f ^ $n ) & ( $l | $g )
+                  )
+                {
+                    ...;
+                }
+
+                for (
+                    $j = 0, $match_j = -1 ;
+                    $j < $sub_len
+                      &&
+
+                      # changed from naive_string_matcher
+                      $sub->[$j] eq $big->[ $i + $j ] ;
+                    $j++
+                  )
+                {
+                    ...;
+                }
+            }
+        }
+    }
+}
+#14...........
+        },
     };
 
     my $ntests = 0 + keys %{$rtests};