Make convert_to_utf8 use Text::Iconv and fallback to Encode; move convert_to_utf8...

[debbugs.git] / Debbugs / Common.pm
diff --git a/Debbugs/Common.pm b/Debbugs/Common.pm

index e269ffc84fa69b8f2fe6462cfe24b0ffac98b95c..eb068edbf4bc589a586989fda55b0ba9678fbacb 100644 (file)
--- a/Debbugs/Common.pm
+++ b/Debbugs/Common.pm
@@ -39,23 +39,32 @@ BEGIN{
  
       @EXPORT = ();
       %EXPORT_TAGS = (util   => [qw(getbugcomponent getbuglocation getlocationpath get_hashname),
  
       @EXPORT = ();
       %EXPORT_TAGS = (util   => [qw(getbugcomponent getbuglocation getlocationpath get_hashname),
-                               qw(appendfile buglog getparsedaddrs getmaintainers),
+                               qw(appendfile overwritefile buglog getparsedaddrs getmaintainers),
+                               qw(bug_status),
                                 qw(getmaintainers_reverse),
                                 qw(getpseudodesc),
                                 qw(getmaintainers_reverse),
                                 qw(getpseudodesc),
+                               qw(package_maintainer),
+                               qw(sort_versions),
                                ],
                                ],
-                    misc   => [qw(make_list globify_scalar english_join)],
+                    misc   => [qw(make_list globify_scalar english_join checkpid),
+                               qw(cleanup_eval_fail),
+                               qw(hash_slice),
+                              ],
+                    utf8   => [qw(encode_utf8_structure encode_utf8_safely),
+                                qw(convert_to_utf8)],
                      date   => [qw(secs_to_english)],
                      quit   => [qw(quit)],
                      lock   => [qw(filelock unfilelock lockpid)],
                     );
       @EXPORT_OK = ();
                      date   => [qw(secs_to_english)],
                      quit   => [qw(quit)],
                      lock   => [qw(filelock unfilelock lockpid)],
                     );
       @EXPORT_OK = ();
-     Exporter::export_ok_tags(qw(lock quit date util misc));
+     Exporter::export_ok_tags(keys %EXPORT_TAGS);
       $EXPORT_TAGS{all} = [@EXPORT_OK];
  }
  
  #use Debbugs::Config qw(:globals);
  
  use Carp;
       $EXPORT_TAGS{all} = [@EXPORT_OK];
  }
  
  #use Debbugs::Config qw(:globals);
  
  use Carp;
+$Carp::Verbose = 1;
  
  use Debbugs::Config qw(:config);
  use IO::File;
  
  use Debbugs::Config qw(:config);
  use IO::File;
@@ -63,8 +72,13 @@ use IO::Scalar;
  use Debbugs::MIME qw(decode_rfc1522);
  use Mail::Address;
  use Cwd qw(cwd);
  use Debbugs::MIME qw(decode_rfc1522);
  use Mail::Address;
  use Cwd qw(cwd);
+use Encode qw(encode_utf8 is_utf8 decode);
+use Text::Iconv;
+use Storable qw(dclone);
+
+use Params::Validate qw(validate_with :types);
  
  
-use Fcntl qw(:flock);
+use Fcntl qw(:DEFAULT :flock);
  
  our $DEBUG_FH = \*STDERR if not defined $DEBUG_FH;
  
  
  our $DEBUG_FH = \*STDERR if not defined $DEBUG_FH;
  
@@ -162,6 +176,8 @@ sub get_hashname {
  
  Returns the path to the logfile corresponding to the bug.
  
  
  Returns the path to the logfile corresponding to the bug.
  
+Returns undef if the bug does not exist.
+
  =cut
  
  sub buglog {
  =cut
  
  sub buglog {
@@ -169,9 +185,27 @@ sub buglog {
      my $location = getbuglocation($bugnum, 'log');
      return getbugcomponent($bugnum, 'log', $location) if ($location);
      $location = getbuglocation($bugnum, 'log.gz');
      my $location = getbuglocation($bugnum, 'log');
      return getbugcomponent($bugnum, 'log', $location) if ($location);
      $location = getbuglocation($bugnum, 'log.gz');
-    return getbugcomponent($bugnum, 'log.gz', $location);
+    return getbugcomponent($bugnum, 'log.gz', $location) if ($location);
+    return undef;
  }
  
  }
  
+=head2 bug_status
+
+     bug_status($bugnum)
+
+
+Returns the path to the summary file corresponding to the bug.
+
+Returns undef if the bug does not exist.
+
+=cut
+
+sub bug_status{
+    my ($bugnum) = @_;
+    my $location = getbuglocation($bugnum, 'summary');
+    return getbugcomponent($bugnum, 'summary', $location) if ($location);
+    return undef;
+}
  
  =head2 appendfile
  
  
  =head2 appendfile
  
@@ -189,6 +223,28 @@ sub appendfile {
         close $fh or die "Unable to close $file: $!";
  }
  
         close $fh or die "Unable to close $file: $!";
  }
  
+=head2 overwritefile
+
+     overwritefile($file,'data','to','append');
+
+Opens file.new, writes data to it, then moves file.new to file.
+
+=cut
+
+sub overwritefile {
+       my ($file,@data) = @_;
+       # write to a temporary sibling first so that $file is only
+       # replaced once the new contents have been written and closed
+       my $fh = IO::File->new("${file}.new",'w') or
+            die "Unable to open ${file}.new for writing: $!";
+       print {$fh} @data or die "Unable to write to ${file}.new: $!";
+       close $fh or die "Unable to close ${file}.new: $!";
+       rename("${file}.new",$file) or
+           die "Unable to rename ${file}.new to $file: $!";
+}
+
+
+
+
+
  =head2 getparsedaddrs
  
       my $address = getparsedaddrs($address);
  =head2 getparsedaddrs
  
       my $address = getparsedaddrs($address);
@@ -223,29 +279,11 @@ Returns a hashref of package => maintainer pairs.
  
  =cut
  
  
  =cut
  
-our $_maintainer;
-our $_maintainer_rev;
+our $_maintainer = undef;
+our $_maintainer_rev = undef;
  sub getmaintainers {
  sub getmaintainers {
-    return $_maintainer if $_maintainer;
-    my %maintainer;
-    my %maintainer_rev;
-    for my $file (@config{qw(maintainer_file maintainer_file_override pseduo_maint_file)}) {
-        next unless defined $file;
-        my $maintfile = IO::File->new($file,'r') or
-             die "Unable to open maintainer file $file: $!";
-        while(<$maintfile>) {
-             next unless m/^(\S+)\s+(\S.*\S)\s*$/;
-             ($a,$b)=($1,$2);
-             $a =~ y/A-Z/a-z/;
-             $maintainer{$a}= $b;
-             for my $maint (map {lc($_->address)} getparsedaddrs($b)) {
-                  push @{$maintainer_rev{$maint}},$a;
-             }
-        }
-        close($maintfile);
-    }
-    $_maintainer = \%maintainer;
-    $_maintainer_rev = \%maintainer_rev;
+    return $_maintainer if defined $_maintainer;
+    package_maintainer(rehash => 1);
      return $_maintainer;
  }
  
      return $_maintainer;
  }
  
@@ -258,11 +296,165 @@ Returns a hashref of maintainer => [qw(list of packages)] pairs.
  =cut
  
  sub getmaintainers_reverse{
  =cut
  
  sub getmaintainers_reverse{
-     return $_maintainer_rev if $_maintainer_rev;
-     getmaintainers();
+     return $_maintainer_rev if defined $_maintainer_rev;
+     package_maintainer(rehash => 1);
       return $_maintainer_rev;
  }
  
       return $_maintainer_rev;
  }
  
+=head2 package_maintainer
+
+     my @s = package_maintainer(source => [qw(foo bar baz)],
+                                binary => [qw(bleh blah)],
+                               );
+
+=over
+
+=item source -- scalar or arrayref of source package names to return
+maintainers for, defaults to the empty arrayref.
+
+=item binary -- scalar or arrayref of binary package names to return
+maintainers for; automatically returns source package maintainer if
+the package name starts with 'src:', defaults to the empty arrayref.
+
+=item reverse -- whether to return the source/binary packages a
+maintainer maintains instead
+
+=item rehash -- whether to reread the maintainer and source maintainer
+files; defaults to 0
+
+=back
+
+=cut
+
+our $_source_maintainer = undef;
+our $_source_maintainer_rev = undef;
+sub package_maintainer {
+    my %param = validate_with(params => \@_,
+                             spec   => {source => {type => SCALAR|ARRAYREF,
+                                                   default => [],
+                                                  },
+                                        binary => {type => SCALAR|ARRAYREF,
+                                                   default => [],
+                                                  },
+                                        maintainer => {type => SCALAR|ARRAYREF,
+                                                       default => [],
+                                                      },
+                                        rehash => {type => BOOLEAN,
+                                                   default => 0,
+                                                  },
+                                        reverse => {type => BOOLEAN,
+                                                    default => 0,
+                                                   },
+                                       },
+                            );
+    my @binary = make_list($param{binary});
+    my @source = make_list($param{source});
+    my @maintainers = make_list($param{maintainer});
+    if ((@binary or @source) and @maintainers) {
+       croak "It is nonsensical to pass both maintainers and source or binary";
+    }
+    if ($param{rehash}) {
+       $_source_maintainer = undef;
+       $_source_maintainer_rev = undef;
+       $_maintainer = undef;
+       $_maintainer_rev = undef;
+    }
+    if (not defined $_source_maintainer or
+       not defined $_source_maintainer_rev) {
+       $_source_maintainer = {};
+       $_source_maintainer_rev = {};
+       for my $fn (@config{('source_maintainer_file',
+                            'source_maintainer_file_override',
+                            'pseudo_maint_file')}) {
+           next unless defined $fn;
+           if (not -e $fn) {
+               warn "Missing source maintainer file '$fn'";
+               next;
+           }
+           __add_to_hash($fn,$_source_maintainer,
+                         $_source_maintainer_rev);
+       }
+    }
+    if (not defined $_maintainer or
+       not defined $_maintainer_rev) {
+       $_maintainer = {};
+       $_maintainer_rev = {};
+       for my $fn (@config{('maintainer_file',
+                            'maintainer_file_override',
+                            'pseudo_maint_file')}) {
+           next unless defined $fn;
+           if (not -e $fn) {
+               warn "Missing maintainer file '$fn'";
+               next;
+           }
+           __add_to_hash($fn,$_maintainer,
+                             $_maintainer_rev);
+       }
+    }
+    my @return;
+    for my $binary (@binary) {
+       if (not $param{reverse} and $binary =~ /^src:/) {
+           push @source,$binary;
+           next;
+       }
+       push @return,grep {defined $_} make_list($_maintainer->{$binary});
+    }
+    for my $source (@source) {
+       $source =~ s/^src://;
+       push @return,grep {defined $_} make_list($_source_maintainer->{$source});
+    }
+    for my $maintainer (grep {defined $_} @maintainers) {
+       push @return,grep {defined $_}
+           make_list($_maintainer_rev->{$maintainer});
+       push @return,map {$_ !~ /^src:/?'src:'.$_:$_} 
+           grep {defined $_}
+               make_list($_source_maintainer_rev->{$maintainer});
+    }
+    return @return;
+}
+
+#=head2 __add_to_hash
+#
+#     __add_to_hash($file,$forward_hash,$reverse_hash,'address');
+#
+# Reads a maintainer/source maintainer/pseudo desc file and adds the
+# maintainers from it to the forward and reverse hashref; assumes that
+# the forward is unique; makes no assumptions of the reverse.
+#
+#=cut
+
+sub __add_to_hash {
+    my ($fn,$forward,$reverse,$type) = @_;
+    if (ref($forward) ne 'HASH') {
+       croak "__add_to_hash must be passed a hashref for the forward";
+    }
+    if (defined $reverse and not ref($reverse) eq 'HASH') {
+       croak "if reverse is passed to __add_to_hash, it must be a hashref";
+    }
+    # 'address' means the value is parsed as mail addresses for the
+    # reverse mapping; any other type uses the value verbatim
+    $type //= 'address';
+    my $fh = IO::File->new($fn,'r') or
+       die "Unable to open $fn for reading: $!";
+    binmode($fh,':encoding(UTF-8)');
+    # read into a lexical: a bare while (<$fh>) assigns to the global
+    # $_ without localizing it, which would clobber the caller's $_
+    while (my $line = <$fh>) {
+       chomp $line;
+       # lines are "key<whitespace>value"; anything else is skipped
+       next unless $line =~ m/^(\S+)\s+(\S.*\S)\s*$/;
+       my ($key,$value)=($1,$2);
+       $key = lc $key;
+       # later entries for the same key replace earlier ones
+       $forward->{$key}= $value;
+       if (defined $reverse) {
+           if ($type eq 'address') {
+               for my $m (map {lc($_->address)} (getparsedaddrs($value))) {
+                   push @{$reverse->{$m}},$key;
+               }
+           }
+           else {
+               push @{$reverse->{$value}}, $key;
+           }
+       }
+    }
+    close($fh);
+    return;
+}
+
+
  =head2 getpseudodesc
  
       my $pseudopkgdesc = getpseudodesc(...);
  =head2 getpseudodesc
  
       my $pseudopkgdesc = getpseudodesc(...);
@@ -276,26 +468,42 @@ pseudopackage or not.
  
  =cut
  
  
  =cut
  
-our $_pseudodesc;
+our $_pseudodesc = undef;
  sub getpseudodesc {
  sub getpseudodesc {
-    return $_pseudodesc if $_pseudodesc;
-    my %pseudodesc;
-
-    if (not defined $config{pseudo_desc_file}) {
-        $_pseudodesc = {};
-        return $_pseudodesc;
-    }
-    my $pseudo = IO::File->new($config{pseudo_desc_file},'r')
-        or die "Unable to open $config{pseudo_desc_file}: $!";
-    while(<$pseudo>) {
-       next unless m/^(\S+)\s+(\S.*\S)\s*$/;
-       $pseudodesc{lc $1} = $2;
-    }
-    close($pseudo);
-    $_pseudodesc = \%pseudodesc;
+    return $_pseudodesc if defined $_pseudodesc;
+    $_pseudodesc = {};
+    __add_to_hash($config{pseudo_desc_file},$_pseudodesc) if
+       defined $config{pseudo_desc_file};
      return $_pseudodesc;
  }
  
      return $_pseudodesc;
  }
  
+=head2 sort_versions
+
+     sort_versions('1.0-2','1.1-2');
+
+Sorts versions using Debbugs::Versions::Dpkg::vercmp. (Using
+AptPkg::Version::compare when it is available is planned, but not yet done.)
+
+=cut
+
+our $vercmp;
+BEGIN{
+    use Debbugs::Versions::Dpkg;
+    $vercmp=\&Debbugs::Versions::Dpkg::vercmp;
+
+# eventually we'll use AptPkg::Version or similar, but the current
+# implementation makes this *super* difficult.
+
+#     eval {
+#      use AptPkg::Version;
+#      $vercmp=\&AptPkg::Version::compare;
+#     };
+}
+
+sub sort_versions{
+    return sort {$vercmp->($a,$b)} @_;
+}
+
  
  =head1 DATE
  
  
  =head1 DATE
  
@@ -330,20 +538,44 @@ These functions are exported with the :lock tag
  
  =head2 filelock
  
  
  =head2 filelock
  
-     filelock
+     filelock($lockfile);
+     filelock($lockfile,$locks);
  
  FLOCKs the passed file. Use unfilelock to unlock it.
  
  
  FLOCKs the passed file. Use unfilelock to unlock it.
  
+Can be passed an optional $locks hashref, which is used to track which
+files are locked (and how many times they have been locked) to allow
+for cooperative locking.
+
  =cut
  
  our @filelocks;
  
  =cut
  
  our @filelocks;
  
+use Carp qw(cluck);
+
  sub filelock {
      # NB - NOT COMPATIBLE WITH `with-lock'
  sub filelock {
      # NB - NOT COMPATIBLE WITH `with-lock'
-    my ($lockfile) = @_;
+    my ($lockfile,$locks) = @_;
      if ($lockfile !~ m{^/}) {
          $lockfile = cwd().'/'.$lockfile;
      }
      if ($lockfile !~ m{^/}) {
          $lockfile = cwd().'/'.$lockfile;
      }
+    # This is only here to allow for relocking bugs inside of
+    # Debbugs::Control. Nothing else should be using it.
+    if (defined $locks and exists $locks->{locks}{$lockfile} and
+       $locks->{locks}{$lockfile} >= 1) {
+       if (exists $locks->{relockable} and
+           exists $locks->{relockable}{$lockfile}) {
+           $locks->{locks}{$lockfile}++;
+           # indicate that the bug for this lockfile needs to be reread
+           $locks->{relockable}{$lockfile} = 1;
+           push @{$locks->{lockorder}},$lockfile;
+           return;
+       }
+       else {
+           use Data::Dumper;
+           confess "Locking already locked file: $lockfile\n".Data::Dumper->Dump([$lockfile,$locks],[qw(lockfile locks)]);
+       }
+    }
      my ($count,$errors);
      $count= 10; $errors= '';
      for (;;) {
      my ($count,$errors);
      $count= 10; $errors= '';
      for (;;) {
@@ -359,13 +591,19 @@ sub filelock {
         }
         if ($fh) {
              push @filelocks, {fh => $fh, file => $lockfile};
         }
         if ($fh) {
              push @filelocks, {fh => $fh, file => $lockfile};
+            if (defined $locks) {
+                $locks->{locks}{$lockfile}++;
+                push @{$locks->{lockorder}},$lockfile;
+            }
              last;
         }
          if (--$count <=0) {
              $errors =~ s/\n+$//;
              last;
         }
          if (--$count <=0) {
              $errors =~ s/\n+$//;
-            die "failed to get lock on $lockfile -- $errors";
+           use Data::Dumper;
+            croak "failed to get lock on $lockfile -- $errors".
+               (defined $locks?Data::Dumper->Dump([$locks],[qw(locks)]):'');
          }
          }
-        sleep 10;
+#        sleep 10;
      }
  }
  
      }
  }
  
@@ -380,6 +618,7 @@ END {
  =head2 unfilelock
  
       unfilelock()
  =head2 unfilelock
  
       unfilelock()
+     unfilelock($locks);
  
  Unlocks the file most recently locked.
  
  
  Unlocks the file most recently locked.
  
@@ -389,10 +628,24 @@ locked with filelock.
  =cut
  
  sub unfilelock {
  =cut
  
  sub unfilelock {
+    my ($locks) = @_;
      if (@filelocks == 0) {
      if (@filelocks == 0) {
-        warn "unfilelock called with no active filelocks!\n";
+        carp "unfilelock called with no active filelocks!\n";
          return;
      }
          return;
      }
+    if (defined $locks and ref($locks) ne 'HASH') {
+       croak "hash not passsed to unfilelock";
+    }
+    if (defined $locks and exists $locks->{lockorder} and
+       @{$locks->{lockorder}} and
+       exists $locks->{locks}{$locks->{lockorder}[-1]}) {
+       my $lockfile = pop @{$locks->{lockorder}};
+       $locks->{locks}{$lockfile}--;
+       if ($locks->{locks}{$lockfile} > 0) {
+           return
+       }
+       delete $locks->{locks}{$lockfile};
+    }
      my %fl = %{pop(@filelocks)};
      flock($fl{fh},LOCK_UN)
          or warn "Unable to unlock lockfile $fl{file}: $!";
      my %fl = %{pop(@filelocks)};
      flock($fl{fh},LOCK_UN)
          or warn "Unable to unlock lockfile $fl{file}: $!";
@@ -417,25 +670,48 @@ Returns 1 on success, false on failure; dies on unusual errors.
  sub lockpid {
       my ($pidfile) = @_;
       if (-e $pidfile) {
  sub lockpid {
       my ($pidfile) = @_;
       if (-e $pidfile) {
-         my $pidfh = IO::File->new($pidfile, 'r') or
-              die "Unable to open pidfile $pidfile: $!";
-         local $/;
-         my $pid = <$pidfh>;
-         ($pid) = $pid =~ /(\d+)/;
-         if (defined $pid and kill(0,$pid)) {
-              return 0;
-         }
-         close $pidfh;
+         my $pid = checkpid($pidfile);
+         die "Unable to read pidfile $pidfile: $!" if not defined $pid;
+         return 0 if $pid != 0;
           unlink $pidfile or
                die "Unable to unlink stale pidfile $pidfile $!";
       }
           unlink $pidfile or
                die "Unable to unlink stale pidfile $pidfile $!";
       }
-     my $pidfh = IO::File->new($pidfile,'w') or
+     my $pidfh = IO::File->new($pidfile,O_CREAT|O_EXCL|O_WRONLY) or
           die "Unable to open $pidfile for writing: $!";
       print {$pidfh} $$ or die "Unable to write to $pidfile $!";
       close $pidfh or die "Unable to close $pidfile $!";
       return 1;
  }
  
           die "Unable to open $pidfile for writing: $!";
       print {$pidfh} $$ or die "Unable to write to $pidfile $!";
       close $pidfh or die "Unable to close $pidfile $!";
       return 1;
  }
  
+=head2 checkpid
+
+     checkpid('/path/to/pidfile');
+
+Checks a pid file and determines if the process listed in the pidfile
+is still running. Returns the pid if it is, 0 if it isn't running, and
+undef if the pidfile doesn't exist or cannot be read.
+
+=cut
+
+sub checkpid{
+     my ($pidfile) = @_;
+     if (-e $pidfile) {
+         my $pidfh = IO::File->new($pidfile, 'r') or
+              return undef;
+         local $/;
+         my $pid = <$pidfh>;
+         close $pidfh;
+         ($pid) = $pid =~ /(\d+)/;
+         if (defined $pid and kill(0,$pid)) {
+              return $pid;
+         }
+         return 0;
+     }
+     else {
+         return undef;
+     }
+}
+
  
  =head1 QUIT
  
  
  =head1 QUIT
  
@@ -480,22 +756,56 @@ sub make_list {
  
  =head2 english_join
  
  
  =head2 english_join
  
-     print english_join(', ',' and ',@list);
+     print english_join(list => \@list);
+     print english_join(\@list);
  
  Joins list properly to make an english phrase.
  
  
  Joins list properly to make an english phrase.
  
+=over
+
+=item normal -- how to separate most values; defaults to ', '
  
  
+=item last -- how to separate the last two values; defaults to ', and '
+
+=item only_two -- how to separate only two values; defaults to ' and '
+
+=item list -- ARRAYREF values to join; if the first argument is an
+ARRAYREF, it's assumed to be the list of values to join
+
+=back
+
+In cases where C<list> is empty, returns ''; when there is only one
+element, returns that element.
  
  =cut
  
  sub english_join {
  
  =cut
  
  sub english_join {
-     my ($normal,$last,@list) = @_;
-     if (@list <= 1) {
-         return @list?$list[0]:();
-     }
-     my $ret = $last . pop(@list);
-     $ret = join($normal,@list) . $ret;
-     return $ret;
+    if (ref $_[0] eq 'ARRAY') {
+       return english_join(list=>$_[0]);
+    }
+    my %param = validate_with(params => \@_,
+                             spec  => {normal => {type => SCALAR,
+                                                  default => ', ',
+                                                 },
+                                       last   => {type => SCALAR,
+                                                  default => ', and ',
+                                                 },
+                                       only_two => {type => SCALAR,
+                                                    default => ' and ',
+                                                   },
+                                       list     => {type => ARRAYREF,
+                                                   },
+                                      },
+                            );
+    my @list = @{$param{list}};
+    if (@list <= 1) {
+       return @list?$list[0]:'';
+    }
+    elsif (@list == 2) {
+       return join($param{only_two},@list);
+    }
+    my $ret = $param{last} . pop(@list);
+    return join($param{normal},@list) . $ret;
  }
  
  
  }
  
  
@@ -519,7 +829,8 @@ sub globify_scalar {
           if (defined ref($scalar)) {
                if (ref($scalar) eq 'SCALAR' and
                    not UNIVERSAL::isa($scalar,'GLOB')) {
           if (defined ref($scalar)) {
                if (ref($scalar) eq 'SCALAR' and
                    not UNIVERSAL::isa($scalar,'GLOB')) {
-                   return IO::Scalar->new($scalar);
+                   open $handle, '>:scalar:utf8', $scalar;
+                   return $handle;
                }
                else {
                     return $scalar;
                }
                else {
                     return $scalar;
@@ -532,9 +843,205 @@ sub globify_scalar {
                carp "Given a non-scalar reference, non-glob to globify_scalar; returning /dev/null handle";
           }
       }
                carp "Given a non-scalar reference, non-glob to globify_scalar; returning /dev/null handle";
           }
       }
-     return IO::File->new('/dev/null','w');
+     return IO::File->new('/dev/null','>:utf8');
  }
  
  }
  
+=head2 cleanup_eval_fail()
+
+     print "Something failed with: ".cleanup_eval_fail($@);
+
+Does various bits of cleanup on the failure message from an eval (or
+any other die message)
+
+Takes at most two options; the first is the actual failure message
+(usually $@ and defaults to $@), the second is the debug level
+(defaults to $DEBUG).
+
+If debug is non-zero, the code at which the failure occurred is output.
+
+=cut
+
+sub cleanup_eval_fail {
+    my ($error,$debug) = @_;
+    # no message given: fall back to the last eval error
+    if (not defined $error or not @_) {
+       $error = $@ // 'unknown reason';
+    }
+    # no debug level given: fall back to $DEBUG
+    if (@_ <= 1) {
+       $debug = $DEBUG // 0;
+    }
+    $debug = 0 if not defined $debug;
+
+    # when debugging, hand the message back untouched
+    if ($debug > 0) {
+       return $error;
+    }
+    # ditch the "at foo/bar/baz.pm line 5"
+    $error =~ s/\sat\s\S+\sline\s\d+//;
+    # ditch croak messages; /m is needed so that ^ matches at the
+    # start of every tab-indented backtrace line rather than only at
+    # the start of the string
+    $error =~ s/^\t+.+\n?//mg;
+    # ditch trailing multiple periods in case there was a cascade of
+    # die messages.
+    $error =~ s/\.+$/\./;
+    return $error;
+}
+
+=head2 hash_slice
+
+     hash_slice(%hash,qw(key1 key2 key3))
+
+For each key, returns matching values and keys of the hash if they exist
+
+=cut
+
+
+# NB: We use prototypes here SPECIFICALLY so that we can be passed a
+# hash without uselessly making a reference to first. DO NOT USE
+# PROTOTYPES USELESSLY ELSEWHERE.
+sub hash_slice(\%@) {
+    my ($hashref,@keys) = @_;
+    return map {exists $hashref->{$_}?($_,$hashref->{$_}):()} @keys;
+}
+
+
+=head1 UTF-8
+
+These functions are exported with the :utf8 tag
+
+=head2 encode_utf8_structure
+
+     %newdata = encode_utf8_structure(%newdata);
+
+Takes a complex data structure and encodes any strings with is_utf8
+set into their constituent octets.
+
+=cut
+
+# recursion depth of encode_utf8_structure; 0 when not running
+our $depth = 0;
+sub encode_utf8_structure {
+    # localized so the counter is restored on return and also when
+    # an exception propagates out of a nested call
+    local $depth = $depth + 1;
+    my @ret;
+    # a named loop variable is used because lexical $_ ("my $_") was
+    # removed from perl in 5.24
+    for my $item (@_) {
+       if (ref($item) eq 'HASH') {
+           # only the outermost call clones; nested data is already
+           # part of that private copy
+           push @ret, {encode_utf8_structure(%{$depth == 1 ? dclone($item):$item})};
+       }
+       elsif (ref($item) eq 'ARRAY') {
+           push @ret, [encode_utf8_structure(@{$depth == 1 ? dclone($item):$item})];
+       }
+       elsif (ref($item)) {
+           # we don't know how to handle non hash or non arrays
+           push @ret,$item;
+       }
+       else {
+           push @ret,encode_utf8_safely($item);
+       }
+    }
+    return @ret;
+}
+
+=head2 encode_utf8_safely
+
+     $octets = encode_utf8_safely($string);
+
+Given a $string, returns the octet equivalent of $string if $string is
+in perl's internal encoding; otherwise returns $string.
+
+Silently returns REFs without encoding them. [If you want to deeply
+encode REFs, see encode_utf8_structure.]
+
+=cut
+
+
+sub encode_utf8_safely{
+    my @ret;
+    for my $r (@_) {
+        # work on a copy: $r aliases the caller's variable (which may
+        # be a read-only literal), so it must not be assigned to
+        my $octets = $r;
+        if (not ref($octets) and is_utf8($octets)) {
+            $octets = encode_utf8($octets);
+        }
+        push @ret,$octets;
+    }
+    # list context: all values. scalar context: the single encoded
+    # value when one argument was passed, otherwise the number of
+    # values (array in scalar context)
+    return wantarray ? @ret : (@_ > 1 ? @ret : $ret[0]);
+}
+
+=head2 convert_to_utf8
+
+    $utf8 = convert_to_utf8("text","charset");
+
+=cut
+
+our %iconv_converters;
+
+sub convert_to_utf8 {
+    my ($data,$charset) = @_;
+    if (is_utf8($data)) {
+        return encode_utf8($data);
+    }
+    $charset = uc($charset);
+    if (not defined $iconv_converters{$charset}) {
+        eval {
+            $iconv_converters{$charset} = Text::Iconv->new($charset,"UTF-8") or
+                die "Unable to create converter for '$charset'";
+        };
+        if ($@) {
+            warn $@;
+            # We weren't able to create the converter, so use Encode
+            # instead
+            return __fallback_convert_to_utf8($data,$charset);
+        }
+        # It shouldn't be necessary when converting to UTF8, but lets
+        # allow for transliteration and silent discarding of broken
+        # sequences
+        eval {
+            $iconv_converters{$charset}->set_attr("transliterate");
+            $iconv_converters{$charset}->set_attr("discard_ilseq");
+        };
+        # This shouldn't fail on Debian systems; we're warning here
+        # just in case we've made a mistake above. This warning should
+        # probably be disabled on non-GNU libc systems.
+        warn $@ if $@;
+    }
+    if (not defined $iconv_converters{$charset}) {
+        warn "The converter for $charset wasn't created properly somehow!";
+        return __fallback_convert_to_utf8($data,$charset);
+    }
+    my $converted_data = $iconv_converters{$charset}->convert($data);
+    # if the conversion failed, retval will be undefined or perhaps
+    # -1.
+    if (not defined $iconv_converters{$charset}->retval() or
+        $iconv_converters{$charset}->retval() < 0
+       ) {
+        # Fallback to encode, which will probably also fail.
+        return __fallback_convert_to_utf8($data,$charset);
+    }
+    return $converted_data;
+}
+
+# Bug #61342 et al.
+# we're switching this to return UTF8 octets instead of perl's internal
+# encoding
+#
+#     __fallback_convert_to_utf8($data,$charset)
+#
+# Encode-based fallback used by convert_to_utf8 when Text::Iconv cannot
+# create a converter or the conversion fails. Returns UTF-8 octets on
+# success. Returns $data unchanged when the charset is 'raw', when
+# no charset is given and $data is not in perl's internal encoding
+# (after warning), or when decoding fails (after warning).
+sub __fallback_convert_to_utf8 {
+     my ($data, $charset) = @_;
+     # raw data just gets returned (that's the charset WordDecoder
+     # uses when it doesn't know what to do); convert_to_utf8
+     # upper-cases the charset, so compare case-insensitively
+     return $data if defined $charset and lc($charset) eq 'raw';
+     if (not defined $charset and not is_utf8($data)) {
+         warn ("Undefined charset, and string '$data' is not in perl's internal encoding");
+         return $data;
+     }
+     # lets assume everything that doesn't have a charset is utf8
+     $charset //= 'utf8';
+     my $result;
+     eval {
+         # strings already in perl's internal encoding only need to
+         # be encoded; everything else is decoded from $charset first
+         $result = is_utf8($data) ? $data : decode($charset,$data);
+         $result = encode_utf8($result);
+     };
+     if ($@) {
+         warn "Unable to decode charset; '$charset' and '$data': $@";
+         return $data;
+     }
+     return $result;
+}
+
+
  
  1;
  
  
  1;