From: Steve Hancock <perltidy@users.sourceforge.net>
Date: Tue, 30 Jun 2020 15:15:06 +0000 (-0700)
Subject: improved vertical alignment and added new test cases
X-Git-Tag: 20200619.02~7
X-Git-Url: https://git.donarmstrong.com/?a=commitdiff_plain;h=3232d3f93f11eb70ea244efee3c967b769a2cdc1;p=perltidy.git

improved vertical alignment and added new test cases
---

diff --git a/lib/Perl/Tidy/Formatter.pm b/lib/Perl/Tidy/Formatter.pm
index 42dd927d..a9ef21ed 100644
--- a/lib/Perl/Tidy/Formatter.pm
+++ b/lib/Perl/Tidy/Formatter.pm
@@ -10776,7 +10776,8 @@ sub send_lines_to_vertical_aligner {
             # These are used below to prevent unwanted cross-line alignments.
             # Unbalanced containers already avoid aligning across
             # container boundaries.
-            my $tok = $tokens_to_go[$i];
+            my $tok        = $tokens_to_go[$i];
+            my $depth_last = $depth;
             if ( $tok =~ /^[\(\{\[]/ ) {    #'(' ) {
 
                 # if container is balanced on this line...
@@ -10880,8 +10881,12 @@ sub send_lines_to_vertical_aligner {
                 # also decorate commas with any container name to avoid
                 # unwanted cross-line alignments.
                 if ( $raw_tok eq ',' || $raw_tok eq '=>' ) {
-                    if ( $container_name[$depth] ) {
-                        $tok .= $container_name[$depth];
+
+                    # If we are at an opening token which increased depth, we have
+                    # to use the name from the previous depth.
+                    my $depth_p = ( $depth_last < $depth ? $depth_last : $depth );
+                    if ( $container_name[$depth_p] ) {
+                        $tok .= $container_name[$depth_p];
                     }
                 }
 
diff --git a/lib/Perl/Tidy/VerticalAligner.pm b/lib/Perl/Tidy/VerticalAligner.pm
index 086bd300..c1222c47 100644
--- a/lib/Perl/Tidy/VerticalAligner.pm
+++ b/lib/Perl/Tidy/VerticalAligner.pm
@@ -2903,10 +2903,37 @@ sub delete_unmatched_tokens {
 
 sub get_line_token_info {
 
-    # Scan lines of tokens and return summary information about the range of
+    # scan lines of tokens and return summary information about the range of
     # levels and patterns.
     my ($rlines) = @_;
 
+    # First scan to check monotonicity. Here is an example of several
+    # lines which are monotonic. The = is the lowest level, and
+    # the commas are all one level deeper. So this is not nonmonotonic.
+    #  $$d{"weeks"}   = [ "w",  "wk",  "wks", "week", "weeks" ];
+    #  $$d{"days"}    = [ "d",  "day", "days" ];
+    #  $$d{"hours"}   = [ "h",  "hr",  "hrs", "hour", "hours" ];
+    my @all_token_info;
+    my $all_monotonic = 1;
+    for ( my $jj = 0 ; $jj < @{$rlines} ; $jj++ ) {
+        my ($line) = $rlines->[$jj];
+        my $rtokens = $line->get_rtokens();
+        my $last_lev;
+        my $is_monotonic = 1;
+        my $i            = -1;
+        foreach my $tok ( @{$rtokens} ) {
+            $i++;
+            my ( $raw_tok, $lev, $tag, $tok_count ) =
+              decode_alignment_token($tok);
+            push @{ $all_token_info[$jj] },
+              [ $raw_tok, $lev, $tag, $tok_count ];
+            last if ( $tok eq '#' );
+            if ( $i > 0 && $lev < $last_lev ) { $is_monotonic = 0 }
+            $last_lev = $lev;
+        }
+        if ( !$is_monotonic ) { $all_monotonic = 0 }
+    }
+
     my $rline_values = [];
     for ( my $jj = 0 ; $jj < @{$rlines} ; $jj++ ) {
         my ($line) = $rlines->[$jj];
@@ -2917,16 +2944,18 @@ sub get_line_token_info {
         my $token_pattern_max = "";
         my %saw_level;
         my @token_info;
+        my $is_monotonic = 1;
 
-        # Find the index of the last token before the side comment
+        # find the index of the last token before the side comment
         my $imax = @{$rtokens} - 2;
 
-        # But if the line ends in a comma list, walk it back to the first such
-        # comma. This will have the effect of making all trailing ragged comma
-        # lists match in the prune tree routine.  These trailing comma lists
-        # can better be handled by later alignment rules.
+	# If the entire group is monotonic, and the line ends in a comma list,
+	# walk it back to the first such comma. this will have the effect of
+	# making all trailing ragged comma lists match in the prune tree
+	# routine.  these trailing comma lists can better be handled by later
+	# alignment rules.
         my $tok_end = $rtokens->[$imax];
-        if ( $tok_end =~ /^,/ ) {
+        if ( $all_monotonic && $tok_end =~ /^,/ ) {
             my $i = $imax - 1;
             while ( $i >= 0 && $rtokens->[$i] eq $tok_end ) {
                 $imax = $i;
@@ -2935,12 +2964,14 @@ sub get_line_token_info {
         }
 
         # make a first pass to find level range
+        my $last_lev;
         foreach my $tok ( @{$rtokens} ) {
             $i++;
             last if ( $i > $imax );
+            last if ($tok eq '#');
             my ( $raw_tok, $lev, $tag, $tok_count ) =
-              decode_alignment_token($tok);
-            push @token_info, [ $raw_tok, $lev, $tag, $tok_count ];
+              @{$all_token_info[$jj]->[$i]};
+
             last if ( $tok eq '#' );
             $token_pattern_max .= $tok;
             $saw_level{$lev}++;
@@ -2949,9 +2980,11 @@ sub get_line_token_info {
                 $lev_max = $lev;
             }
             else {
-                if ( $lev < $lev_min ) { $lev_min = $lev; }
-                if ( $lev > $lev_max ) { $lev_max = $lev; }
+                if ( $lev < $lev_min )  { $lev_min      = $lev; }
+                if ( $lev > $lev_max )  { $lev_max      = $lev; }
+                if ( $lev < $last_lev ) { $is_monotonic = 0 }
             }
+            $last_lev = $lev;
         }
 
         # handle no levels
@@ -2977,14 +3010,15 @@ sub get_line_token_info {
             $rtoken_patterns->{$lev_max} = $token_pattern_max;
             $rtoken_indexes->{$lev_max}  = [ ( 0 .. $imax ) ];
 
-            my $DEBUG   = 0;
+            my $debug = 0;
             my $lev_top = pop @levs;    # alread did max level
             my $itok    = -1;
             foreach my $tok ( @{$rtokens} ) {
                 $itok++;
                 last if ( $itok > $imax );
+                ##my ( $raw_tok, $lev, $tag, $tok_count ) = @{ $token_info[$itok] };
                 my ( $raw_tok, $lev, $tag, $tok_count ) =
-                  @{ $token_info[$itok] };
+                  @{$all_token_info[$jj]->[$itok]};
                 last if ( $raw_tok eq '#' );
                 foreach my $lev_test (@levs) {
                     next if ( $lev > $lev_test );
@@ -2996,9 +3030,12 @@ sub get_line_token_info {
         }
 
         push @{$rline_values},
-          [ $lev_min, $lev_max, $rtoken_patterns, \@levs, $rtoken_indexes, ];
+          [
+            $lev_min, $lev_max,        $rtoken_patterns,
+            \@levs,   $rtoken_indexes, $is_monotonic
+          ];
 
-        # DEBUG
+        # debug
         0 && do {
             local $" = ')(';
             print "lev_min=$lev_min, lev_max=$lev_max, levels=(@levs)\n";
@@ -3276,6 +3313,7 @@ sub prune_alignment_tree {
     #  $jbeg..$jend is the range of line indexes,
     #  $level_keep is the minimum level to keep
     my @delete_list;
+    my %end_group;
 
     my $starting_depth = 0;    # normally 0 except for debugging
 
@@ -3296,25 +3334,49 @@ sub prune_alignment_tree {
             # nothing to do if no children
             next unless defined($nc_beg_p);
 
-            # Define the number of lines to either keep or delete a child node.
-            # This is the key decision we have to make.  We want to delete
-            # short runs of matched lines, and keep long runs.  The following
-            # rule has given good results but it might be optimized in the
-            # future to include more variables.
-            my $nlines_keep = $depth + 3;
-            my $nlines_p    = $jend_p - $jbeg_p + 1;
-            if ( $nlines_keep > $nlines_p - 1 ) { $nlines_keep = $nlines_p - 1 }
+	    # Define the number of lines to either keep or delete a child node.
+	    # This is the key decision we have to make.  We want to delete
+	    # short runs of matched lines, and keep long runs.  It seems easier
+	    # for the eye to follow breaks in monotonic level changes than
+	    # non-monotonic level changes.  For example, the following looks
+	    # best if we delete the lower level alignments:
+
+            #  [1]                  ~~ [];
+            #  [ ["foo"], ["bar"] ] ~~ [ qr/o/, qr/a/ ];
+            #  [ qr/o/, qr/a/ ]     ~~ [ ["foo"], ["bar"] ];
+            #  [ "foo", "bar" ]     ~~ [ qr/o/, qr/a/ ];
+            #  [ qr/o/, qr/a/ ]     ~~ [ "foo", "bar" ];
+            #  $deep1               ~~ $deep1;
+
+            # So we will use two thresholds.  
+            my $nmin_mono     = $depth + 3;
+            my $nmin_non_mono = $depth + 6;
+            my $nlines_p          = $jend_p - $jbeg_p + 1;
+            if ( $nmin_mono > $nlines_p - 1 ) {
+                $nmin_mono = $nlines_p - 1;
+            }
+            if ( $nmin_non_mono > $nlines_p - 1 ) {
+                $nmin_non_mono = $nlines_p - 1;
+            }
 
             # loop to keep or delete each child node
+            my $jend_c_keep;
             foreach my $nc ( $nc_beg_p .. $nc_end_p ) {
                 my ( $jbeg_c, $jend_c, $np_c, $lev_c, $pat_c, $nc_beg_c,
                     $nc_end_c )
                   = @{ $match_tree[ $depth + 1 ]->[$nc] };
                 my $nlines_c = $jend_c - $jbeg_c + 1;
-                if ( $nlines_c < $nlines_keep ) {
+                my $is_monotonic = $rline_values->[$jbeg_c]->[5];
+                my $nmin = $is_monotonic ? $nmin_mono : $nmin_non_mono;
+                if ( $nlines_c < $nmin ) {
                     push @delete_list, [ $jbeg_c, $jend_c, $lev_p ];
                 }
                 else {
+                    if ( defined($jend_c_keep) && $jbeg_c == $jend_c_keep + 1 )
+                    {
+                        $rlines->[$jend_c_keep]->{_end_group} = 1;
+                    }
+                    $jend_c_keep = $jend_c;
                     push @todo_next, $nc;
                 }
             }
@@ -3356,7 +3418,6 @@ sub Dump_tree_groups {
         my @fix = @{$item};
         foreach (@fix) { $_ = "undef" unless defined $_; }
         $fix[4] = "...";
-        $fix[7] = "...";
         print "(@fix)\n";
     }
 }
diff --git a/t/snippets/align25.in b/t/snippets/align25.in
index ad093b97..ce545d2a 100644
--- a/t/snippets/align25.in
+++ b/t/snippets/align25.in
@@ -1,4 +1,4 @@
-# do not align commas here; different container types
+# do not align internal commas here; different container types
 is_deeply( [ $a,        $a ], [ $b,               $c ] );
 is_deeply( { foo => $a, bar => $a }, { foo => $b, bar => $c } );
 is_deeply( [ \$a,       \$a ], [ \$b,             \$c ] );
diff --git a/t/snippets/expect/align25.def b/t/snippets/expect/align25.def
index 72d462cf..3b1434f6 100644
--- a/t/snippets/expect/align25.def
+++ b/t/snippets/expect/align25.def
@@ -1,5 +1,5 @@
-# do not align commas here; different container types
-is_deeply( [ $a, $a ], [ $b, $c ] );
+# do not align internal commas here; different container types
+is_deeply( [ $a, $a ],               [ $b, $c ] );
 is_deeply( { foo => $a, bar => $a }, { foo => $b, bar => $c } );
-is_deeply( [ \$a, \$a ], [ \$b, \$c ] );
+is_deeply( [ \$a, \$a ],             [ \$b, \$c ] );
 
diff --git a/t/snippets/expect/prune.def b/t/snippets/expect/prune.def
index 1b7e8688..205d840a 100644
--- a/t/snippets/expect/prune.def
+++ b/t/snippets/expect/prune.def
@@ -31,3 +31,21 @@ $_SetCommState = ff( "k32", "SetCommState", [ N, P ],                I );
 $_SetupComm    = ff( "k32", "SetupComm",    [ N, N, N ],             I );
 $_PurgeComm    = ff( "k32", "PurgeComm",    [ N, N ],                I );
 $_CreateEvent  = ff( "k32", "CreateEvent",  [ P, I, I, P ],          N );
+
+is_deeply \@t, [
+
+    [3],            [0],            [1],            [0],
+    3,              [1],            3,              [1],
+    2,              [0],            [1],            [0],
+    [1],            [1],            [1],            2,
+    3,              [1],            2,              [3],
+    4,              [ 7, 8 ],       9,              ["a"],
+    "b",            3,              2,              5,
+    3,              2,              5,              3,
+    [2],            5,              4,              5,
+    [ 3, 2, 1 ],    1,              2,              3,
+    [ -1, -2, -3 ], [ -1, -2, -3 ], [ -1, -2, -3 ], [ -1, -2 ],
+    3,              [ -1, -2 ],     3,              [ -1, -2, -3 ],
+    [ !1 ],         [ 8, 7, 6 ],    [ 8, 7, 6 ],    [4],
+    !!0,
+];
diff --git a/t/snippets/make_expect.pl b/t/snippets/make_expect.pl
index cdbc678b..e80e23a9 100755
--- a/t/snippets/make_expect.pl
+++ b/t/snippets/make_expect.pl
@@ -275,8 +275,8 @@ EOM
     if ( -e $diff_file ) {
         $diff_msg = <<EOM;
 Look at each differences in '$diff_file'
-The full old ouput for 'somefile.def' is in expect/somefile.def
-The full new ouput for 'somefile.def' is in tmp/somefile.def
+The full old output for 'somefile.def' is in expect/somefile.def
+The full new output for 'somefile.def' is in tmp/somefile.def
 EOM
 
     }
diff --git a/t/snippets/packing_list.txt b/t/snippets/packing_list.txt
index c512946a..21da717f 100644
--- a/t/snippets/packing_list.txt
+++ b/t/snippets/packing_list.txt
@@ -256,6 +256,7 @@
 ../snippets21.t	switch_plain.switch_plain
 ../snippets21.t	sot.def
 ../snippets21.t	sot.sot
+../snippets21.t	prune.def
 ../snippets3.t	ce_wn1.ce_wn
 ../snippets3.t	ce_wn1.def
 ../snippets3.t	colin.colin
@@ -396,4 +397,3 @@
 ../snippets9.t	rt98902.def
 ../snippets9.t	rt98902.rt98902
 ../snippets9.t	rt99961.def
-../snippets21.t	prune.def
diff --git a/t/snippets/prune.in b/t/snippets/prune.in
index 1b7e8688..90d43387 100644
--- a/t/snippets/prune.in
+++ b/t/snippets/prune.in
@@ -31,3 +31,22 @@ $_SetCommState = ff( "k32", "SetCommState", [ N, P ],                I );
 $_SetupComm    = ff( "k32", "SetupComm",    [ N, N, N ],             I );
 $_PurgeComm    = ff( "k32", "PurgeComm",    [ N, N ],                I );
 $_CreateEvent  = ff( "k32", "CreateEvent",  [ P, I, I, P ],          N );
+
+
+is_deeply \@t, [
+
+ [3],  [0],  [1],  [0],
+ 3,   [1],  3,   [1],
+ 2,   [0],  [1],  [0],
+ [1],  [1],  [1],  2,
+ 3,   [1],  2,   [3],
+ 4,   [ 7, 8 ],  9,   ["a"],
+ "b",  3,   2,   5,
+ 3,   2,   5,   3,
+  [2],    5,      4,      5,
+  [ 3, 2, 1 ],  1,      2,      3,
+  [ -1, -2, -3 ], [ -1, -2, -3 ], [ -1, -2, -3 ], [ -1, -2 ],
+  3,      [ -1, -2 ],   3,      [ -1, -2, -3 ],
+  [ !1 ],   [ 8, 7, 6 ],  [ 8, 7, 6 ],  [4],
+  !!0,
+];
diff --git a/t/snippets13.t b/t/snippets13.t
index 257c1e4a..a98e59b2 100644
--- a/t/snippets13.t
+++ b/t/snippets13.t
@@ -149,7 +149,7 @@ my $p    = TAP::Parser::SubclassTest->new(
 ----------
 
         'align25' => <<'----------',
-# do not align commas here; different container types
+# do not align internal commas here; different container types
 is_deeply( [ $a,        $a ], [ $b,               $c ] );
 is_deeply( { foo => $a, bar => $a }, { foo => $b, bar => $c } );
 is_deeply( [ \$a,       \$a ], [ \$b,             \$c ] );
@@ -393,10 +393,10 @@ my $p = TAP::Parser::SubclassTest->new(
             source => "align25",
             params => "def",
             expect => <<'#17...........',
-# do not align commas here; different container types
-is_deeply( [ $a, $a ], [ $b, $c ] );
+# do not align internal commas here; different container types
+is_deeply( [ $a, $a ],               [ $b, $c ] );
 is_deeply( { foo => $a, bar => $a }, { foo => $b, bar => $c } );
-is_deeply( [ \$a, \$a ], [ \$b, \$c ] );
+is_deeply( [ \$a, \$a ],             [ \$b, \$c ] );
 
 #17...........
         },
diff --git a/t/snippets21.t b/t/snippets21.t
index 40b8ed61..77c4485b 100644
--- a/t/snippets21.t
+++ b/t/snippets21.t
@@ -89,6 +89,25 @@ $_SetCommState = ff( "k32", "SetCommState", [ N, P ],                I );
 $_SetupComm    = ff( "k32", "SetupComm",    [ N, N, N ],             I );
 $_PurgeComm    = ff( "k32", "PurgeComm",    [ N, N ],                I );
 $_CreateEvent  = ff( "k32", "CreateEvent",  [ P, I, I, P ],          N );
+
+
+is_deeply \@t, [
+
+ [3],  [0],  [1],  [0],
+ 3,   [1],  3,   [1],
+ 2,   [0],  [1],  [0],
+ [1],  [1],  [1],  2,
+ 3,   [1],  2,   [3],
+ 4,   [ 7, 8 ],  9,   ["a"],
+ "b",  3,   2,   5,
+ 3,   2,   5,   3,
+  [2],    5,      4,      5,
+  [ 3, 2, 1 ],  1,      2,      3,
+  [ -1, -2, -3 ], [ -1, -2, -3 ], [ -1, -2, -3 ], [ -1, -2 ],
+  3,      [ -1, -2 ],   3,      [ -1, -2, -3 ],
+  [ !1 ],   [ 8, 7, 6 ],  [ 8, 7, 6 ],  [4],
+  !!0,
+];
 ----------
 
         'sot' => <<'----------',
@@ -320,6 +339,24 @@ $_SetCommState = ff( "k32", "SetCommState", [ N, P ],                I );
 $_SetupComm    = ff( "k32", "SetupComm",    [ N, N, N ],             I );
 $_PurgeComm    = ff( "k32", "PurgeComm",    [ N, N ],                I );
 $_CreateEvent  = ff( "k32", "CreateEvent",  [ P, I, I, P ],          N );
+
+is_deeply \@t, [
+
+    [3],            [0],            [1],            [0],
+    3,              [1],            3,              [1],
+    2,              [0],            [1],            [0],
+    [1],            [1],            [1],            2,
+    3,              [1],            2,              [3],
+    4,              [ 7, 8 ],       9,              ["a"],
+    "b",            3,              2,              5,
+    3,              2,              5,              3,
+    [2],            5,              4,              5,
+    [ 3, 2, 1 ],    1,              2,              3,
+    [ -1, -2, -3 ], [ -1, -2, -3 ], [ -1, -2, -3 ], [ -1, -2 ],
+    3,              [ -1, -2 ],     3,              [ -1, -2, -3 ],
+    [ !1 ],         [ 8, 7, 6 ],    [ 8, 7, 6 ],    [4],
+    !!0,
+];
 #6...........
         },
     };