updated to an improved list marking method

author Steve Hancock <perltidy@users.sourceforge.net>

Wed, 23 Dec 2020 22:36:45 +0000 (14:36 -0800)

committer Steve Hancock <perltidy@users.sourceforge.net>

Wed, 23 Dec 2020 22:36:45 +0000 (14:36 -0800)
author Steve Hancock <perltidy@users.sourceforge.net>
Wed, 23 Dec 2020 22:36:45 +0000 (14:36 -0800)
committer Steve Hancock <perltidy@users.sourceforge.net>
Wed, 23 Dec 2020 22:36:45 +0000 (14:36 -0800)
diff --git a/lib/Perl/Tidy.pm b/lib/Perl/Tidy.pm

index f358a0818b3a7780b4405d88688a258c1406d1e1..0ef550910a5d7a5493534d8c7549d8c808d9fdf9 100644 (file)
--- a/lib/Perl/Tidy.pm
+++ b/lib/Perl/Tidy.pm
@@ -1,5 +1,5 @@
  #
-###########################################################-
+###########################################################
  #
  #    perltidy - a perl script indenter and formatter
  #
diff --git a/lib/Perl/Tidy/VerticalAligner.pm b/lib/Perl/Tidy/VerticalAligner.pm

index b8898442b5f7d74c7ede747e6274c46eddc35197..ed0ae56e4ad20f98fa2f152a6f195d8073cfc5de 100644 (file)
--- a/lib/Perl/Tidy/VerticalAligner.pm
+++ b/lib/Perl/Tidy/VerticalAligner.pm
@@ -340,7 +340,7 @@ use constant DEBUG_VALIGN => 0;
  # Flag for use during conversion to using new $list_seqno
  # to identify lists of items.  The flag 'is_forced_break' will
  # be removed when conversion is complete.
-use constant TEST_LIST_SEQNO => 0;
+use constant TEST_OLD_LIST => 0;
  
  sub valign_input {
  
@@ -717,7 +717,7 @@ EOM
      # Decide if this is a simple list of items.
      # We use this to be less restrictive in deciding what to align.
      # --------------------------------------------------------------------
-    if (TEST_LIST_SEQNO) {
+    if ( !TEST_OLD_LIST ) {
          decide_if_list($new_line) if ($list_seqno);
      }
      else {
@@ -1549,6 +1549,11 @@ sub _flush_group_lines {
              my $imax_pair = $line_1->get_imax_pair();
              if ( $imax_pair > $imax_align ) { $imax_align = $imax_pair }
  
+            ## flag for possible future use:
+            ## my $is_isolated_pair = $imax_pair < 0
+            ##  && ( $jbeg == 0
+            ##    || $rall_lines->[ $jbeg - 1 ]->get_imax_pair() < 0 );
+
              my ( $is_marginal, $imax_align_fix ) =
                is_marginal_match( $line_0, $line_1, $grp_level, $imax_align );
              if ($is_marginal) {
@@ -1739,6 +1744,64 @@ EOM
      }
  }
  
+sub two_line_pad {
+
+    my ( $line_m, $line, $imax_min ) = @_;
+
+    # Given:
+    #  two isolated (list) lines
+    #  imax_min = number of common alignment tokens
+    # Return:
+    #  $pad_max = maximum suggested pad distnce
+    #           = 0 if alignment not recommended
+    # Method:
+    # Note that this is only for two lines which do not have alignment tokens
+    # in common with any other lines.  It is intended for lists, but it might
+    # also be used for two non-list lines with a common leading '='.
+
+    # Use a minimum pad distance not less than the minimum of two mean
+    # field lengths.  The idea is to avoid aligning lines with very
+    # different field lengths, like these two:
+    #   [
+    #       'VARCHAR', DBI::SQL_VARCHAR, undef, "'", "'", undef, 0, 1,
+    #       1, 0, 0, 0, undef, 0, 0
+    #   ];
+    my $short_pad        = 4;
+    my $rfield_lengths   = $line->get_rfield_lengths();
+    my $rfield_lengths_m = $line_m->get_rfield_lengths();
+
+    # Safety check
+    my $jmax_m = $line_m->get_jmax();
+    my $jmax   = $line->get_jmax();
+    if ( $imax_min > $jmax_m - 2 ) { $imax_min = $jmax_m - 2 }
+    if ( $imax_min > $jmax - 2 )   { $imax_min = $jmax - 2 }
+
+    my $avg   = 0;
+    my $avg_m = 0;
+    for ( my $i = 0 ; $i <= $imax_min ; $i++ ) {
+        $avg_m += $rfield_lengths_m->[$i];
+        $avg   += $rfield_lengths->[$i];
+    }
+    $avg   /= ( $imax_min + 1 );
+    $avg_m /= ( $imax_min + 1 );
+    my $avg_min = $avg <= $avg_m ? $avg : $avg_m;
+
+    my $pad_max = $short_pad;
+    if ( $pad_max < $avg_min ) { $pad_max = $avg_min }
+    my $pad_first = $rfield_lengths->[0] - $rfield_lengths_m->[0];
+
+    # Usually we allow pads to occur wherever they can go, but for two
+    # list lines we will not align if the first pad is too large. This
+    # can avoid some poor alignments of two lines. For example, this is
+    # not so good:
+    #   [
+    #       0, 'OPpLVREF_SV',    'SV', 1, 'OPpLVREF_AV', 'AV', 2,
+    #       'OPpLVREF_HV', 'HV', 3,    'OPpLVREF_CV', 'CV',
+    #   ];
+    $pad_max = 0 if ( $pad_first < -$pad_max || $pad_first > $pad_max );
+    return $pad_max;
+}
+
  sub sweep_left_to_right {
  
      my ( $rlines, $rgroups, $group_level ) = @_;
@@ -1835,7 +1898,7 @@ sub sweep_left_to_right {
          if (
                 $jend == $jbeg
              && $jend_m == $jbeg_m
-            && !( $list_type && !TEST_LIST_SEQNO )
+            && !( $list_type && TEST_OLD_LIST )
              && ( $ng == 1 || $istop_mm < 0 )
              && ( $ng == $ng_max || $istop < 0 )
              && !$line->get_j_terminal_match()
@@ -1849,16 +1912,20 @@ sub sweep_left_to_right {
          {
  
              # We will just align assignments and simple lists
+            next unless ( $imax_min >= 0 );
              next
-              unless ( $imax_min >= 0 && $rtokens->[0] =~ /^=\d/
-                || ( TEST_LIST_SEQNO && $list_type ) );
+              unless ( $rtokens->[0] =~ /^=\d/
+                || ( !TEST_OLD_LIST && $list_type ) );
  
-            # In this case we will limit padding to one indent distance.  This
+            # In this case we will limit padding to a short distance.  This
              # is a compromise to keep some vertical alignment but prevent large
              # gaps, which do not look good for just two lines.
+            my $pad_max =
+              two_line_pad( $rlines->[$jbeg], $rlines->[$jbeg_m], $imax_min );
+            next unless ($pad_max);
              my $ng_m = $ng - 1;
-            $max_move{"$ng_m"} = $short_pad;
-            $max_move{"$ng"}   = $short_pad;
+            $max_move{"$ng_m"} = $pad_max;
+            $max_move{"$ng"}   = $pad_max;
          }
  
          # Loop to find all common leading tokens.
@@ -3163,7 +3230,7 @@ sub match_line_pairs {
              elsif ( $list_type && $list_type eq $list_type_m ) {
  
                  # do not align lists across a ci jump with new list method
-                if ( TEST_LIST_SEQNO && $ci_jump ) { $imax_min = -1 }
+                if ( !TEST_OLD_LIST && $ci_jump ) { $imax_min = -1 }
  
                  my $i_nomatch = $imax_min + 1;
                  for ( my $i = 0 ; $i <= $imax_min ; $i++ ) {
diff --git a/local-docs/BugLog.pod b/local-docs/BugLog.pod

index 831f31ed5ebe6c1f61a493566f5c7d4c59c8c738..e7ff6522dda9b7e93c4c6fc6e64af91431f8d644 100644 (file)
--- a/local-docs/BugLog.pod
+++ b/local-docs/BugLog.pod
@@ -2,6 +2,49 @@
  
  =over 4
  
+=item B<improve list marking method>
+
+In the process of making vertical alignments, lines which are simple lists of
+items are treated different from other lines. The old method for finding and
+marking these lines had a few problems which are corrected with this update.
+The main problem was that the old method ran into trouble when there were side
+comments.  For example, the old method was not marking the following list and
+as a result the two columns of values were not aligned:
+
+    # OLD
+    return (
+        $startpos, $ldelpos - $startpos,         # PREFIX
+        $ldelpos,  1,                            # OPENING BRACKET
+        $ldelpos + 1, $endpos - $ldelpos - 2,    # CONTENTS
+        $endpos - 1, 1,                          # CLOSING BRACKET
+        $endpos, length($$textref) - $endpos,    # REMAINDER
+    );
+
+    # NEW
+    return (
+        $startpos,    $ldelpos - $startpos,           # PREFIX
+        $ldelpos,     1,                              # OPENING BRACKET
+        $ldelpos + 1, $endpos - $ldelpos - 2,         # CONTENTS
+        $endpos - 1,  1,                              # CLOSING BRACKET
+        $endpos,      length($$textref) - $endpos,    # REMAINDER
+    );
+
+Another problem was that occasionally unwanted alignments were made between
+lines which were not really lists because the lines were incorrectly marked.
+For example (note padding after first comma)
+
+    # OLD: (undesirable alignment)
+    my ( $isig2, $chisq ) = ( 1 / ( $sig * $sig ), 0 );
+    my ( $ym,    $al, $cov, $bet, $olda, $ochisq, $di, $pivt, $info ) =
+      map { null } ( 0 .. 8 );
+
+    # NEW: (no alignment)
+    my ( $isig2, $chisq ) = ( 1 / ( $sig * $sig ), 0 );
+    my ( $ym, $al, $cov, $bet, $olda, $ochisq, $di, $pivt, $info ) =
+      map { null } ( 0 .. 8 );
+
+This update was made 22 Dec 2020.
+
  =item B<Fix git #51, closing quote pattern delimiters not following -cti flag settings>
  
  Closing pattern delimiter tokens of qw quotes were not following the -cti flag
diff --git a/t/snippets/expect/kba1.kba1 b/t/snippets/expect/kba1.kba1

index 453e439cd908da82f8a45ca5f055aa77579db96e..c18f5ea15df5385aebf24e5b14483e7e9c31c254 100644 (file)
--- a/t/snippets/expect/kba1.kba1
+++ b/t/snippets/expect/kba1.kba1
@@ -1,6 +1,6 @@
  $this_env = join(
      "", $before, $closures
-    , $contents
+    ,   $contents
      , ( $defenv ? '' : &balance_tags() )
      , $reopens
  );
diff --git a/t/snippets/expect/style.style1 b/t/snippets/expect/style.style1

index c25402fddaaa36fda9cab8a30c44b15c4ab8b0aa..785d48657156df89543c56838e260575351fb631 100644 (file)
--- a/t/snippets/expect/style.style1
+++ b/t/snippets/expect/style.style1
@@ -1,7 +1,7 @@
  # This test snippet is from package bbbike v3.214 by Slaven Rezic; GPL 2.0 licence
  sub arrange_topframe {
    my (@order) = (
-    $hslabel_frame, $km_frame, $speed_frame[0],
+    $hslabel_frame,  $km_frame,   $speed_frame[0],
      $power_frame[0], $wind_frame, $percent_frame, $temp_frame,
      @speed_frame[1 .. $#speed_frame],
      @power_frame[1 .. $#power_frame],
diff --git a/t/snippets10.t b/t/snippets10.t

index c6f904efea0fedb4b8defbea9a9949dc9ce43fad..302e61485b90d23d07a54c1d68a9fe407b5bb724 100644 (file)
--- a/t/snippets10.t
+++ b/t/snippets10.t
@@ -760,7 +760,7 @@ sub arrange_topframe {
  # This test snippet is from package bbbike v3.214 by Slaven Rezic; GPL 2.0 licence
  sub arrange_topframe {
    my (@order) = (
-    $hslabel_frame, $km_frame, $speed_frame[0],
+    $hslabel_frame,  $km_frame,   $speed_frame[0],
      $power_frame[0], $wind_frame, $percent_frame, $temp_frame,
      @speed_frame[1 .. $#speed_frame],
      @power_frame[1 .. $#power_frame],
diff --git a/t/snippets22.t b/t/snippets22.t

index 12567450e796f90986febd3931d0e8166bdb6962..92563c258b62f8068a3886aed94ba6591889750b 100644 (file)
--- a/t/snippets22.t
+++ b/t/snippets22.t
@@ -628,7 +628,7 @@ method 'foo2' => [ Int, Int ] => sub {
              expect => <<'#16...........',
  $this_env = join(
      "", $before, $closures
-    , $contents
+    ,   $contents
      , ( $defenv ? '' : &balance_tags() )
      , $reopens
  );
author	Steve Hancock <perltidy@users.sourceforge.net>
	Wed, 23 Dec 2020 22:36:45 +0000 (14:36 -0800)
committer	Steve Hancock <perltidy@users.sourceforge.net>
	Wed, 23 Dec 2020 22:36:45 +0000 (14:36 -0800)
lib/Perl/Tidy.pm		patch \| blob \| history
lib/Perl/Tidy/VerticalAligner.pm		patch \| blob \| history
local-docs/BugLog.pod		patch \| blob \| history
t/snippets/expect/kba1.kba1		patch \| blob \| history
t/snippets/expect/style.style1		patch \| blob \| history
t/snippets10.t		patch \| blob \| history
t/snippets22.t		patch \| blob \| history