From: Steve Hancock <perltidy@users.sourceforge.net>
Date: Fri, 15 Sep 2023 01:13:51 +0000 (-0700)
Subject: update comments
X-Git-Tag: 20230912.01~4
X-Git-Url: https://git.donarmstrong.com/?a=commitdiff_plain;h=4bc7f969cf1e14df96dc0c69a7ee9f8eb951c678;p=perltidy.git

update comments
---

diff --git a/.perlcriticrc b/.perlcriticrc
index e9a88267..31cce025 100644
--- a/.perlcriticrc
+++ b/.perlcriticrc
@@ -1,23 +1,19 @@
-# Perlcritic is a very useful tool for locating potential code problems.
-# This file customizes it to the specific needs of Perl::Tidy.
+# This file is used for running Perl::Critic on Perl::Tidy modules.  Many of
+# the policies are excellent starting points for new code, but important
+# exceptions often exist which make it impossible to use them as rigid rules.
+
+# I have found the '## no critic' method for locally deactivating specific
+# policies to be far too troublesome to use.  So policies without fine tuning
+# controls have to either be 'on' or 'off'.
 
 # Some useful links:
+# https://metacpan.org/dist/Perl-Critic/view/lib/Perl/Critic/PolicySummary.pod
 # https://manpages.ubuntu.com/manpages/xenial/man1/perlcritic.1p.html
 # https://perlmaven.com/perl-critic
-# https://metacpan.org/dist/Perl-Critic/view/lib/Perl/Critic/PolicySummary.pod
 
 # Example command to run a single policy on single module:
 # perlcritic --single-policy Subroutines::ProhibitSubroutinePrototypes Module.pm
 
-# This file lists the policies which must be adjusted or deactivated for
-# Perl::Tidy.  Many of the policies are excellent starting points for new code,
-# but important exceptions often exist which make it impossible to use them as
-# rigid rules.
-
-# I have found the '## no critic' method for locally deactivating specific
-# policies to be too buggy to use.  So policies without fine tuning controls
-# have to either be 'on' or 'off'.
-
 # severity = 1 gives the most strict checking.
 severity = 1
 
@@ -38,15 +34,15 @@ verbose = %f: [%p] %m at line %l, column %c.\n
 [Subroutines::RequireArgUnpacking]
 short_subroutine_statements = 2
 
-# Completely Disagree: The advantages of 'use constant' greatly outweigh the
-# few disadvantages.  Perl::Tidy relies heavily on constants for efficient and
-# robust coding of array indexes and for compiling out debug code, and to
-# avoid autovivication problems that would occur if hashes were used instead.
+# Disagree: The advantages of 'use constant' greatly outweigh the few
+# disadvantages.  Perl::Tidy relies heavily on constants for efficient and
+# robust coding of array indexes and for compiling out debug code, and to avoid
+# autovivication problems that would occur if hashes were used instead.
 [-ValuesAndExpressions::ProhibitConstantPragma]
 
-# Completely Disagree: adding quotes on here doc terminators causes needless
-# "line noise" in the source code.  Almost always the default works.  Besides,
-# my editor uses color to make it clear if interpolation is in effect.
+# Disagree: adding quotes on here doc terminators causes needless "line noise"
+# in the source code.  Almost always the default works.  Besides, my editor
+# uses color to make it clear if interpolation is in effect.
 [-ValuesAndExpressions::RequireQuotedHeredocTerminator]
 
 # Perlcritic doesn't seem to see that @ARGV in Perl::Tidy actually **is**
@@ -126,7 +122,7 @@ max_characters=250
 [-ValuesAndExpressions::ProhibitNoisyQuotes]
 
 # postfix 'if' is good if it highlights control flow
-# postfix 'unless' is likewise good but must be simple, without negative terms
+# postfix 'unless' is likewise good if simple and without negative terms
 [ControlStructures::ProhibitPostfixControls]
 allow = if unless
 
@@ -160,7 +156,7 @@ allow = if unless
 # As the documentation says, this policy is not for everyone
 [-RegularExpressions::ProhibitEnumeratedClasses]
 
-# Completely Disagree. Double quotes are easier to read than single quotes and
+# Disagree. Double quotes are easier to read than single quotes and
 # allow a uniform style for quotes.  My editor has color coding which indicates
 # interpolation. Double quotes do not increase processing time by any
 # measurable amount.  Using them as default simplfies making editing changes.
@@ -175,8 +171,7 @@ allow = if unless
 # ternary expressions. There is little to be gained by omitting them.
 [-CodeLayout::ProhibitParensWithBuiltins] 
 
-# This is OK if we exclude 'print'. Most of the 'print' statements
-# in perltidy are for error reporting, and it does not help to add
-# more extra error checks on top of them. 
+# Exclude 'print' statements, which are mainly used for debug statements
+# and error reporting.
 [InputOutput::RequireCheckedSyscalls]
 exclude_functions = print
diff --git a/lib/Perl/Tidy/Formatter.pm b/lib/Perl/Tidy/Formatter.pm
index e0f22174..c5a4b241 100644
--- a/lib/Perl/Tidy/Formatter.pm
+++ b/lib/Perl/Tidy/Formatter.pm
@@ -2256,7 +2256,10 @@ EOM
 
 sub initialize_token_break_preferences {
 
-    # implement user break preferences
+    # Initialize these global hashes defining break preferences:
+    # %want_break_before
+    # %break_before_container_types
+
     my $break_after = sub {
         my @toks = @_;
         foreach my $tok (@toks) {
@@ -3785,10 +3788,15 @@ EOM
 
         # Essential whitespace means whitespace which cannot be safely deleted
         # without risking the introduction of a syntax error.
-        # We are given three tokens and their types:
-        # ($tokenl, $typel) is the token to the left of the space in question
-        # ($tokenr, $typer) is the token to the right of the space in question
-        # ($tokenll, $typell) is previous nonblank token to the left of $tokenl
+
+        # Given: three tokens and their types:
+        # ($tokenll, $typell) = previous nonblank token to the left of $tokenl
+        # ($tokenl, $typel)   = the token to the left of the space in question
+        # ($tokenr, $typer)   = the token to the right of the space in question
+
+        # Return:
+        #   true  if whitespace is needed
+        #   false if whitespace may be deleted
         #
         # Note1: This routine should almost never need to be changed.  It is
         # for avoiding syntax problems rather than for formatting.
@@ -3839,6 +3847,11 @@ EOM
         my $token_joined         = $tokenl . $tokenr;
         my $tokenl_is_dash       = $tokenl eq '-';
 
+        #-------------------
+        # Must do full check
+        #-------------------
+
+        # This long logical expression gives the result
         my $result =
 
           # never combine two bare words or numbers
@@ -7692,14 +7705,22 @@ sub set_CODE_type {
     # 'VER' = VERSION statement
     # ''    = ordinary line of code with no restrictions
 
+    #--------------------
+    # Loop over all lines
+    #--------------------
     my $ix_line = -1;
     foreach my $line_of_tokens ( @{$rlines} ) {
         $ix_line++;
         my $line_type = $line_of_tokens->{_line_type};
 
         my $last_CODE_type = $CODE_type;
+
+        # Set default to be ordinary code
         $CODE_type = EMPTY_STRING;
 
+        #-------------------------------------
+        # This is only for lines marked 'CODE'
+        #-------------------------------------
         if ( $line_type ne 'CODE' ) {
             next;
         }
@@ -7716,7 +7737,9 @@ sub set_CODE_type {
             else                { $has_side_comment = 1 }
         }
 
+        #-----------------------------------------------------------
         # Write line verbatim if we are in a formatting skip section
+        #-----------------------------------------------------------
         if ($In_format_skipping_section) {
 
             # Note: extra space appended to comment simplifies pattern matching
@@ -7762,7 +7785,9 @@ sub set_CODE_type {
             next;
         }
 
-        # Check for a continued quote..
+        #----------------------------
+        # Check for a continued quote
+        #----------------------------
         if ( $line_of_tokens->{_starting_in_quote} ) {
 
             # A line which is entirely a quote or pattern must go out
@@ -7777,7 +7802,9 @@ sub set_CODE_type {
             }
         }
 
+        #-------------------------------------------------
         # See if we are entering a formatting skip section
+        #-------------------------------------------------
         if (
             $is_block_comment
 
@@ -7803,13 +7830,17 @@ sub set_CODE_type {
             $jmax--;
         }
 
-        # blank line..
+        #-----------
+        # Blank line
+        #-----------
         if ( $jmax < 0 ) {
             $CODE_type = 'BL';
             next;
         }
 
-        # Handle comments
+        #---------
+        # Comments
+        #---------
         if ($is_block_comment) {
 
             # see if this is a static block comment (starts with ## by default)
@@ -7917,8 +7948,9 @@ sub set_CODE_type {
             }
         }
 
-        # End of comments. Handle a line of normal code:
-
+        #-------------------------
+        # Other special code types
+        #-------------------------
         if ($rOpts_indent_only) {
             $CODE_type = 'IO';
             next;
@@ -8974,6 +9006,12 @@ sub respace_post_loop_ops {
 
     my ($self) = @_;
 
+    # We have just completed the 'respace' operation, in which we have made
+    # a pass through all tokens and set the whitespace between tokens to be
+    # according to user settings.  The new tokens have been placed in the new
+    # token list '$rLL_new'. Now we have to go through this new list and
+    # define some indexes which allow quick access into it.
+
     # Walk backwards through the tokens, making forward links to sequence items.
     if ( @{$rLL_new} ) {
         my $KNEXT;
@@ -9195,11 +9233,11 @@ sub store_token {
     # Store one token during respace operations
     #------------------------------------------
 
-    # Input parameter:
-    #  if defined => reference to a token
-    #  if undef   => make and store a blank space
+    # Optional input parameter: '$item'
+    #  if defined => reference to a token to be stored
+    #  otherwise  => make and store a blank space
 
-    # NOTE: called once per token so coding efficiency is critical.
+    # NOTE: this sub is called once per token so coding efficiency is critical.
 
     # If no arg, then make and store a blank space
     if ( !$item ) {
@@ -11199,12 +11237,18 @@ sub weld_cuddled_blocks {
 } ## end sub weld_cuddled_blocks
 
 sub find_nested_pairs {
-    my $self = shift;
+
+    my ($self) = @_;
 
     # This routine is called once per file to do preliminary work needed for
     # the --weld-nested option.  This information is also needed for adding
     # semicolons.
 
+    # Returns:
+    #   \@nested_pairs = ref to a list in which each item is a ref to
+    #   to the sequence numbers of two nested containers:
+    #        [ $seqno_inner, $seqno_outer ]
+
     my $rLL = $self->[_rLL_];
     return unless ( defined($rLL) && @{$rLL} );
     my $Num = @{$rLL};
@@ -11403,6 +11447,10 @@ sub find_nested_pairs {
         next;
     }
 
+    #------------------------------------
+    # Make the final list of nested pairs
+    #------------------------------------
+
     # The weld routine expects the pairs in order in the form
     #   [$seqno_inner, $seqno_outer]
     # And they must be in the same order as the inner closing tokens
@@ -12997,7 +13045,7 @@ sub break_before_list_opening_containers {
 
     my ($self) = @_;
 
-    # This routine is called once per batch to implement parameters
+    # This routine is called once per batch to implement parameters:
     # --break-before-hash-brace=n and similar -bbx=n flags
     #    and their associated indentation flags:
     # --break-before-hash-brace-and-indent and similar -bbxi=n
@@ -13033,8 +13081,15 @@ sub break_before_list_opening_containers {
         $length_tol *= 2;
     }
 
+    #-------------------------------------------------------
+    # These arrays are used to mark the affected containers:
+    #-------------------------------------------------------
     my $rbreak_before_container_by_seqno = {};
     my $rwant_reduced_ci                 = {};
+
+    #------------------------------
+    # Main loop over all containers
+    #------------------------------
     foreach my $seqno ( keys %{$K_opening_container} ) {
 
         #----------------------------------------------------------------
@@ -13370,9 +13425,13 @@ sub break_before_list_opening_containers {
         $rLL->[$KK]->[_CI_LEVEL_] = $ci if ( $ci >= 0 );
     }
 
+    #------------------
+    # Store the results
+    #------------------
     $self->[_rbreak_before_container_by_seqno_] =
       $rbreak_before_container_by_seqno;
     $self->[_rwant_reduced_ci_] = $rwant_reduced_ci;
+
     return;
 } ## end sub break_before_list_opening_containers
 
@@ -14295,6 +14354,8 @@ sub is_fragile_block_type {
 
         my ( $self, $iline, $K_begin_loop, $K_terminal, $K_last ) = @_;
 
+        # Loop over all tokens on a line for sub xlp_collapse_lengths
+
         my $rLL                 = $self->[_rLL_];
         my $K_closing_container = $self->[_K_closing_container_];
 
@@ -19745,11 +19806,16 @@ EOM
     sub recombine_inner_loop {
         my ( $self, $rhash ) = @_;
 
-        # This is the inner loop of the recombine operation. We look at all of
-        # the remaining joints in this section and select the best joint to be
-        # recombined.  If a recombination is made, the number of lines
-        # in this section will be reduced by one.
+        # This is the inner loop of the recombine operation. We are working on
+        # a sequence of multiple lines. We look at each pair of lines and
+        # decide if formatting would be improved if the pair were joined
+        # into a single line. If there are multiple of such possible
+        # recombinations, we select the best.  If a recombination is made,
+        # the number of lines in this group of lines will be reduced by one.
+        # See comments in the calling routine for further explanation.
 
+        # Input:
+        #    $rhash has parameters controlling this recombine operation
         # Returns: nothing
 
         my $rK_weld_right = $self->[_rK_weld_right_];
@@ -19768,7 +19834,7 @@ EOM
         my $ix_best = 0;
         my $num_bs  = 0;
 
-        # The range of lines in this group is $nbeg to $nstop
+        # The index range of lines in this group is $nbeg to $nstop
         my $nmax       = @{$ri_end} - 1;
         my $nstop      = $nmax - $rhash->{_num_freeze};
         my $num_joints = $nstop - $nbeg;
@@ -20290,7 +20356,9 @@ EOM
         my ( $ri_beg, $ri_end, $n, $this_line_is_semicolon_terminated ) = @_;
 
         # Recombine Section 2:
-        # Examine token at $iend_1 (right end of first line of pair)
+        # We are comparing two lines to see if they should be combined
+        # into a single line. This sub examines the token '$iend_1' in
+        # the following diagram (right end of first line of pair):
 
         # Here are Indexes of the endpoint tokens of the two lines:
         #
@@ -20779,7 +20847,9 @@ EOM
         my ( $ri_beg, $ri_end, $n, $this_line_is_semicolon_terminated ) = @_;
 
         # Recombine Section 3:
-        # Examine token at $ibeg_2 (right end of first line of pair)
+        # We are comparing two lines to see if they should be combined
+        # into a single line. This sub examines the token '$ibeg_2' in
+        # the following diagram (left end of second line of pair):
 
         # Here are Indexes of the endpoint tokens of the two lines:
         #
@@ -23232,9 +23302,11 @@ EOM
 
         #-------------------------------------------
         # END of loop over all tokens in this batch
-        # Now set breaks for any unfinished lists ..
         #-------------------------------------------
 
+        #----------------------------------------
+        # Now set breaks for any unfinished lists
+        #----------------------------------------
         foreach my $dd ( reverse( $minimum_depth .. $current_depth ) ) {
 
             $interrupted_list[$dd]   = 1;
@@ -23264,11 +23336,11 @@ EOM
             }
         } ## end for ( my $dd = $current_depth...)
 
-        #----------------------------------------
-        # Return the flag '$saw_good_breakpoint'.
-        #----------------------------------------
-        # This indicates if the input file had some good breakpoints.  This
-        # flag will be used to force a break in a line shorter than the
+        #------------------------------------------------
+        # Set the return the flag '$saw_good_breakpoint'.
+        #------------------------------------------------
+        # This flag indicates if the input file had some good breakpoints.
+        # It will be used to force a break in a line shorter than the
         # allowed line length.
         if ( $has_old_logical_breakpoints[$current_depth] ) {
             $saw_good_breakpoint = 1;
@@ -24670,6 +24742,7 @@ EOM
         my $interrupted         = $rhash_IN->{interrupted};
         my $rdo_not_break_apart = $rhash_IN->{rdo_not_break_apart};
         my $must_break_open     = $rhash_IN->{must_break_open};
+
 ## NOTE: these input vars from caller use the values from rhash_A (see above):
 ##      my $item_count          = $rhash_IN->{item_count};
 ##      my $identifier_count    = $rhash_IN->{identifier_count};
@@ -26382,6 +26455,10 @@ sub get_available_spaces_to_go {
     sub lp_decreasing_depth {
         my ( $self, $ii ) = @_;
 
+        # This is called by sub set_lp_indentation for a token at index $ii
+        # which has a lower nesting depth compared to the previous token.
+        # We have to update the stack variables for the new indentation.
+
         my $rLL = $self->[_rLL_];
 
         my $level    = $levels_to_go[$ii];
@@ -26493,6 +26570,10 @@ EOM
     sub lp_increasing_depth {
         my ( $self, $ii ) = @_;
 
+        # This is called by sub set_lp_indentation for a token at index $ii
+        # which has an increasing nesting depth compared to the previous token.
+        # We have to update the stack variables for the new indentation.
+
         my $rLL = $self->[_rLL_];
 
         my $type     = $types_to_go[$ii];
@@ -27698,7 +27779,9 @@ EOM
         # $ralignment_type_to_go->[$i] equal to those tokens at which we would
         # accept vertical alignment.
 
-        # Initialize closure (and return) variables:
+        #----------------------------
+        # Initialize return variables
+        #----------------------------
         $ralignment_type_to_go   = [];
         $ralignment_counts       = [];
         $ralignment_hash_by_line = [];
@@ -30226,6 +30309,13 @@ sub make_paren_name {
         # Determine indentation adjustment for a line with a leading closing
         # token - i.e. one of these:     ) ] } :
 
+        # Returns:
+        #   adjust_indentation flag:
+        #       0 - do not adjust
+        #       1 - outdent
+        #       2 - vertically align with opening token
+        #       3 - indent
+
         my (
             $self,    #