4c97a1c690c25d4fbd5f968a0030d9b49af0eddf
[bugscan.git] / scanlib.pm
1 #! /usr/bin/perl
2 # vim: ts=4 sw=4 nowrap
3 #
4 # General functions for scanning the BTS-database.
5 # Based on bugscan, written by Richard Braakman <dark@debian.org>,
6 # which was based on an unknown other script.
7 #
8 # Global variables:
9 #   %comments       - map from bugnumber to bug description
10 #   %premature      - list of prematurely closed bugreports
11 #   %exclude        - list of bugreports to exclude from the report
12 #   %maintainer     - map from packagename to maintainer
13 #   %section        - map from packagename to section in the FTP-site
14 #   %packagelist    - map from packagename to bugreports
15 #   %NMU            - map with NMU information
16
17 use lib qw(/org/bugs.debian.org/perl);
18 use LWP::UserAgent;
19 use Debbugs::MIME qw(decode_rfc1522 encode_rfc1522);
20 use Debbugs::Packages;
21 use Debbugs::Versions;
22 use Debbugs::Status;
23 use Fcntl qw(O_RDONLY);
24 use strict;
25 use warnings;
26 require bugcfg;
27 package scanlib;
28
29 our (%comments,%premature,%exclude,%maintainer,%section,%packagelist,%NMU,%debbugssection,%bugs);
30
# readcomments($file)
#
# Load the bug commentary file into %comments, %premature and %exclude
# (all three are reset first).
#
# The file is in paragraph format: paragraphs are separated by blank
# lines, and the first line of each paragraph is the bug number or
# package name the comment applies to.  The remaining lines of the
# paragraph are collected, newline-terminated, in $comments{$key}.
#
#   *KEY         - the leading * marks KEY in %premature, which forces the
#                  bug to be listed even if it is closed
#   KEY EXCLUDE  - KEY is recorded in %exclude and gets no comment entry
#
# Dies if the file cannot be opened.
sub readcomments {
    my ($file) = @_;                # Name of comments-file
    my $index;                      # Key (bug number/package) of current comment

    %comments  = ();                # Initialize our data
    %premature = ();
    %exclude   = ();

    # Three-argument open: the filename is never interpreted as a mode
    # or a command.
    open(my $fh, '<', $file) or die "open $file: $!\n";
    while (my $line = <$fh>) {
        chomp $line;
        if ($line =~ m/^\s*$/) {                # Paragraph break
            undef $index;
        }
        elsif (defined $index) {                # Body line of current comment
            $comments{$index} .= $line . "\n";
        }
        else {                                  # First line of a paragraph
            # Strip both markers before recording anything, so the keys
            # stored in %premature and %exclude are the bare bug number.
            my $is_premature = ($line =~ s/^\*//);
            my $is_excluded  = ($line =~ s/\s+EXCLUDE\s*//);

            $premature{$line} = 1 if $is_premature;
            if ($is_excluded) {
                $exclude{$line} = 1;
                next;
            }
            $index = $line;
            $comments{$index} = '';             # New comment, initialize data
        }
    }
    close($fh);
}
66
67
# readmaintainers()
#
# Read the list of maintainers from $bugcfg::maintainerlist into
# %maintainer (lower-cased package name => maintainer).
#
# Each line must be "<package> <maintainer>"; any other line (including
# an empty one) is fatal.  A maintainer written in the old
# "address (Real Name)" form is rewritten to "Real Name <address>".
#
# Dies if the file cannot be opened or a line cannot be parsed.
sub readmaintainers {
    open(my $fh, '<', $bugcfg::maintainerlist)
        or die "open $bugcfg::maintainerlist: $!\n";
    while (my $line = <$fh>) {
        chomp $line;
        $line =~ m/^(\S+)\s+(\S.*\S)\s*$/ or die "Maintainers: $line ?";
        my ($pkg, $mnt) = ($1, $2);             # Package name, maintainer name & email
        $pkg =~ tr/A-Z/a-z/;                    # Normalize package-name

        # No <...> present: try the "address (Name)" form.
        if ($mnt !~ m/</ and $mnt =~ m/(\S+)\s+\(([^)]+)\)/) {
            $mnt = "$2 <$1>";
        }
        $maintainer{$pkg} = $mnt;
    }
    close($fh);
}
87
88
# readsources($root, $archive)
#
# For every section in @bugcfg::sections, read
# $root/<section>/source/Sources.gz (through zcat) and record each source
# package in %section as "$archive/<section>".
#
# Dies if the zcat pipe cannot be started.
sub readsources {
    my ($root, $archive) = @_;      # Root and name of the archive we are scanning

    for my $sect (@bugcfg::sections) {
        my $sources = "$root/$sect/source/Sources.gz";

        # List-form pipe open: the path is handed to zcat as a single
        # argument and never passes through a shell.
        open(my $pipe, '-|', 'zcat', $sources)
            or die "open: $sect sourcelist: $!\n";
        while (my $line = <$pipe>) {
            chomp $line;
            # We're only interested in the packagenames; strip the fieldname.
            next unless $line =~ s/^Package:\s+//;
            $section{$line} = "$archive/$sect";
        }
        # NOTE: zcat's exit status is not checked here, so an unreadable
        # Sources.gz only shows up as zcat's own message on stderr.
        close($pipe);
    }
}
108
# readpackages($root, $archive)
#
# For every architecture in @bugcfg::architectures and every section in
# @bugcfg::sections, read $root/<section>/binary-<arch>/Packages.gz
# (through zcat) and record each binary package in %section as
# "$archive/<section>".
#
# Dies if the zcat pipe cannot be started.
sub readpackages {
    my ($root, $archive) = @_;      # Root and name of the archive we are scanning

    for my $arch (@bugcfg::architectures) {
        for my $sect (@bugcfg::sections) {
            my $packages = "$root/$sect/binary-$arch/Packages.gz";

            # List-form pipe open: no shell is involved, so unusual
            # characters in the path cannot be misinterpreted.
            open(my $pipe, '-|', 'zcat', $packages)
                or die "open: $packages: $!\n";
            while (my $line = <$pipe>) {
                chomp $line;
                # We're only interested in the packagenames; strip the fieldname.
                next unless $line =~ s/^Package:\s+//;
                $section{$line} = "$archive/$sect";
            }
            # NOTE: zcat's exit status is not checked here.
            close($pipe);
        }
    }
}
131
# readdebbugssources($file, $archive)
#
# Read a whitespace-separated table whose columns are
#   host  binary-package  section  version  source-package
# and record the section of both the binary and the source package in
# %debbugssection.  A section that does not already start with $archive
# is stored as "$archive/<section>".
#
# Lines with fewer than three fields (e.g. blank lines) are ignored.
# Dies if the file cannot be opened.
sub readdebbugssources {
    my ($file, $archive) = @_;

    open(my $fh, '<', $file)
        or die "open: $file: $!\n";
    while (my $line = <$fh>) {
        chomp $line;
        my ($host, $bin, $sect, $ver, $src) = split /\s+/, $line;
        next unless defined $sect;              # Blank or truncated line

        my $sectname = ($sect =~ /^\Q$archive\E/) ? $sect : "$archive/$sect";
        $debbugssection{$bin} = $sectname;
        $debbugssection{$src} = $sectname if defined $src;
    }
    close($fh);
}
149
# readpseudopackages()
#
# Read $bugcfg::pseudolist and register the first whitespace-delimited
# word of every line in %section with the section name "pseudo".
# Lines that are empty or start with whitespace are ignored.
#
# Dies if the file cannot be opened.
sub readpseudopackages {
    open(my $fh, '<', $bugcfg::pseudolist)
        or die("open $bugcfg::pseudolist: $!\n");
    while (my $line = <$fh>) {
        chomp $line;
        $line =~ s/\s.*//;                      # Keep only the package name
        next if $line eq '';                    # Nothing to register
        $section{$line} = "pseudo";
    }
    close($fh);
}
159
160
# scanspool()
#
# Walk the spool directory $bugcfg::spooldir and hand every subdirectory
# whose name consists only of digits to scanspooldir().
#
# Side effect: changes the current working directory (here and again in
# scanspooldir).  NOTE(review): the paths passed on are built from
# $bugcfg::spooldir after the chdir, so this presumably expects an
# absolute path - confirm against bugcfg.
#
# Dies if the spool directory cannot be entered or read.
sub scanspool {
    chdir($bugcfg::spooldir) or die "chdir $bugcfg::spooldir: $!\n";

    # Lexical handle: not shared with the directory handle used by
    # scanspooldir.
    opendir(my $dh, $bugcfg::spooldir) or die "opendir $bugcfg::spooldir: $!\n";
    my @dirs = grep { m/^\d+$/ } readdir($dh);
    closedir($dh);

    for my $dir (@dirs) {
        scanspooldir("$bugcfg::spooldir/$dir");
    }
}
176
# scanspooldir($dir)
#
# Scan one spool directory for "<number>.summary" files and register the
# interesting bugs in %bugs and %packagelist.
#
# For every bug number found:
#   * bugs listed in %exclude are skipped;
#   * the status is loaded with Debbugs::Status::read_bug; unreadable bugs
#     are skipped;
#   * the bug is skipped unless its severity is in @bugcfg::priorities, or
#     if it carries any tag listed in @bugcfg::skiptags;
#   * for each distribution selected by the bug's tags (woody, sarge, etch,
#     sid, experimental; none of them means testing+unstable+experimental)
#     Debbugs::Status::bug_presence is consulted, and the upper-cased first
#     letter of the distribution (O, S, T, U, E) is added to the release
#     info unless the bug is 'absent' or 'fixed' there;
#   * a bug with empty release info is dropped unless it is in %premature;
#   * a merged bug is dropped if the first bug in its 'mergedwith' list has
#     a lower number (presumably that list is sorted - TODO confirm);
#   * the bug is appended to $packagelist{<package>} for each of its
#     packages known in %section or %debbugssection; the latter case adds
#     an "X" to the release info;
#   * $bugs{<number>} is set to "<number> <tags>[ [<relinfo>]] <subject>".
#
# Side effect: changes the current working directory to $dir.
# Dies if $dir cannot be entered or read.
sub scanspooldir {
    my ($dir) = @_;

    chdir($dir) or die "chdir $dir: $!\n";

    opendir(my $dh, $dir) or die "opendir $dir: $!\n";
    my @list = grep { s/\.summary$// }          # ... reduced to the bug number
               grep { m/^\d+\.summary$/ }       # Summary files only ...
               readdir($dh);
    closedir($dh);

    for my $f (@list) {
        next if $exclude{$f};                   # Check the list of bugs to skip

        my $bug = Debbugs::Status::read_bug(summary => "$f.summary");
        next if (!defined($bug));

        # Skip unless the severity is one we report on ...
        my $skip = 1;
        for my $walk (@bugcfg::priorities) {
            $skip = 0 if $walk eq $bug->{'severity'};
        }

        # ... and skip anyway if any tag is on the skip list.
        my @tags = split(' ', $bug->{'keywords'});
        for my $tag (@tags) {
            for my $s (@bugcfg::skiptags) {
                $skip = 1 if $tag eq $s;
            }
        }
        next if $skip == 1;

        # Number of occurrences of each distribution tag (scalar grep).
        my %disttags = ();
        $disttags{'oldstable'}    = grep(/^woody$/, @tags);
        $disttags{'stable'}       = grep(/^sarge$/, @tags);
        $disttags{'testing'}      = grep(/^etch$/, @tags);
        $disttags{'unstable'}     = grep(/^sid$/, @tags);
        $disttags{'experimental'} = grep(/^experimental$/, @tags);

        # default according to dondelelcaro 2006-11-11
        if (!$disttags{'oldstable'} && !$disttags{'stable'} && !$disttags{'testing'} && !$disttags{'unstable'} && !$disttags{'experimental'}) {
            $disttags{'testing'} = 1;
            $disttags{'unstable'} = 1;
            $disttags{'experimental'} = 1;
        }

        # only bother to check the versioning status for the distributions indicated by the tags
        my $relinfo = "";
        # The qw() lists are parenthesized: "for my $x qw(...)" is a syntax
        # error on perl >= 5.18.
        for my $dist (qw(oldstable stable testing unstable experimental)) {
            local $SIG{__WARN__} = sub {};      # Silence warnings raised during the version lookups

            next if (!$disttags{$dist});

            # only check for the archs we care about
            my %svhash = ();
            for my $arch (qw(alpha amd64 arm hppa i386 ia64 mips mipsel powerpc s390 sparc)) {
                my @versions = Debbugs::Packages::getversions($bug->{'package'}, $dist, $arch);
                my @sourceversions = Debbugs::Packages::makesourceversions($bug->{'package'}, $arch, @versions);

                for my $sv (@sourceversions) {
                    $svhash{$sv} = 1;
                }
            }

            my @sourceversions = keys %svhash;
            my $presence = Debbugs::Status::bug_presence(bug => $f, status => $bug, sourceversions => \@sourceversions);

            # ignore bugs that are absent/fixed in this distribution, include everything
            # else (that is, "found" which says that the bug is present, and undef, which
            # indicates that no versioning information is present and it's not closed
            # unversioned)
            if (!defined($presence) || ($presence ne 'absent' && $presence ne 'fixed')) {
                $relinfo .= uc(substr($dist, 0, 1));
            }
        }

        next if $relinfo eq '' and not $premature{$f};
        $premature{$f}++ if $relinfo eq '';

        # One fixed-width column per tag of interest.
        my $taginfo = "[";
        $taginfo .= ($bug->{'keywords'} =~ /\bpending\b/        ? "P" : " ");
        $taginfo .= ($bug->{'keywords'} =~ /\bpatch\b/          ? "+" : " ");
        $taginfo .= ($bug->{'keywords'} =~ /\bhelp\b/           ? "H" : " ");
        $taginfo .= ($bug->{'keywords'} =~ /\bmoreinfo\b/       ? "M" : " ");
        $taginfo .= ($bug->{'keywords'} =~ /\bunreproducible\b/ ? "R" : " ");
        $taginfo .= ($bug->{'keywords'} =~ /\bsecurity\b/       ? "S" : " ");
        $taginfo .= ($bug->{'keywords'} =~ /\bupstream\b/       ? "U" : " ");
        $taginfo .= ($bug->{'keywords'} =~ /\betch-ignore\b/    ? "I" : " ");
        $taginfo .= "]";

        if (length($bug->{'mergedwith'})) {
            my @merged = split(' ', $bug->{'mergedwith'});
            next if ($merged[0] < $f);
        }

        for my $package (split /[,\s]+/, $bug->{'package'}) {
            # Lower-case the name and cut it at the first character that
            # cannot be part of a package name.  A lexical is used so the
            # caller's $_ is left alone and $` is not needed.
            my $name = $package;
            $name =~ tr/A-Z/a-z/;
            $name =~ s/[^-+._a-z0-9].*//s;

            if (not defined $section{$name}) {
                if (defined $debbugssection{$name}) {
                    $relinfo .= "X";
                } else {
                    next;   # Skip unavailable packages
                }
            }

            push @{$packagelist{$name}}, $f;
        }

        $relinfo = " [$relinfo]" if $relinfo ne "";

        $bugs{$f} = "$f $taginfo$relinfo " . $bug->{'subject'};
    }
}
297
298
# readstatus($file)
#
# Read a status file and fill %bugs, %packagelist, %section and
# %maintainer from it.  The file consists of two kinds of lines:
#
#   "<package> <section> <maintainer>"  - starts the bug list of a package
#   "<number> [<tags>..."               - a bug of the most recent package;
#                                         everything after the number is
#                                         stored in $bugs{<number>}
#
# Bug lines that appear before any package line are stored in %bugs but
# are not attached to a package.
#
# Dies if the file cannot be opened.
sub readstatus {
    my ($file) = @_;        # Name of statusfile
    my $pkg;                # Name of current package

    open(my $fh, '<', $file) or die "open $file: $!";
    while (my $line = <$fh>) {
        chomp $line;
        if ($line =~ m/^[0-9]+ \[/) {
            my ($bug, $subject) = split(/ /, $line, 2);
            $bugs{$bug} = $subject;
            # Without a current package there is no list to append to.
            push @{$packagelist{$pkg}}, $bug if defined $pkg;
        } else {
            my ($sect, $mnt);
            # An empty line yields no fields and therefore resets $pkg.
            ($pkg, $sect, $mnt) = split(/ /, $line, 3);
            next if (!defined($pkg));
            $section{$pkg} = $sect;
            $maintainer{$pkg} = $mnt;
        }
    }
    close($fh);
}
324
325
# readNMUstatus($url)
#
# Fetch $url and parse it as blank-line separated paragraphs of
# "Field: value" lines.  For every paragraph the values of the fields
# whose names contain "bug", "source" and "version" (case-insensitive)
# are stored as
#
#   $NMU{$bug}            = 1
#   $NMU{$bug, "source"}  = source upload which closes the bug
#   $NMU{$bug, "version"} = version where the bug was closed
#
# Field values are not reset between paragraphs, so a paragraph lacking a
# field inherits the value seen in an earlier paragraph.
#
# If the request fails a warning is issued and %NMU is left untouched, so
# an HTTP error page is never parsed as data.
sub readNMUstatus {
    my ($url) = @_;
    my $bug;            # Number of current bug
    my $source;         # Source upload which closes this bug.
    my $version;        # Version where this bug was closed.
    my $pending = 0;    # Whether the current paragraph still has to be stored.

    my $response = LWP::UserAgent->new->request(HTTP::Request->new(GET => $url));
    if (!$response->is_success) {
        warn "readNMUstatus: GET $url failed: " . $response->status_line . "\n";
        return;
    }

    # Store the paragraph collected so far, if there is one to store.
    my $store = sub {
        return unless $pending and defined $bug;
        $NMU{$bug} = 1;
        $NMU{$bug, "source"} = $source;
        $NMU{$bug, "version"} = $version;
        $pending = 0;
    };

    for my $line (split /\n/, $response->content) {
        if ($line =~ m/^$/) {                   # Paragraph break
            $store->();
            $pending = 0;
        } else {
            my ($field, $value) = split(/: /, $line, 2);
            $bug     = $value if ($field =~ /bug/i);
            $source  = $value if ($field =~ /source/i);
            $version = $value if ($field =~ /version/i);
            $pending = 1;
        }
    }
    $store->();                                 # Last paragraph without trailing blank line
    return;
}
357
358
# urlsanit($url)
#
# Make a string safe for use inside an HREF attribute: '%' and '+' are
# percent-encoded, then the HTML special characters < > & " are replaced
# by their named entities.  Returns the sanitized copy.
sub urlsanit {
    my ($raw) = @_;
    my %entity_for = (
        '<' => 'lt',
        '>' => 'gt',
        '&' => 'amp',
        '"' => 'quot',
    );

    # Percent signs first, so the '%' of "%2b" is not escaped again.
    (my $clean = $raw) =~ s/%/%25/g;
    $clean =~ s/\+/%2b/g;
    $clean =~ s/([<>&"])/'&' . $entity_for{$1} . ';'/ge;
    return $clean;
}
367
# htmlsanit($text)
#
# Replace the HTML special characters < > & " in $text by their named
# entities and return the result.  An undefined argument yields the empty
# string; every defined value - including "0" - is preserved.
sub htmlsanit {
    my %saniarray = ('<','lt', '>','gt', '&','amp', '"','quot');
    my $in = shift;
    # Test definedness, not truth: "0" is a legitimate value to print.
    $in = "" unless defined $in;
    $in =~ s/([<>&"])/\&$saniarray{$1};/g;
    return $in;
}
374
# wwwnumber($number)
#
# Return an HTML link (<A HREF=...>) to the bugs.debian.org bug report
# page for bug $number, with the number itself as link text.  The number
# is passed through urlsanit() for the URL and htmlsanit() for the text.
#
# Declared without a prototype: the former "()" prototype claimed the sub
# takes no arguments although it requires one.
sub wwwnumber {
    my ($number) = @_;              # Number of bug to html-ize

    return "<A HREF=\"http://bugs.debian.org/cgi-bin/bugreport.cgi?archive=no&amp;bug=" .
        urlsanit($number) . '">' . htmlsanit($number) . '</A>';
}
384
# wwwname($name)
#
# Return an HTML link (<A HREF=...>) to the bugs.debian.org package
# report page for package $name, with the name itself as link text.  The
# name is passed through urlsanit() for the URL and htmlsanit() for the
# text.
#
# Declared without a prototype: the former "()" prototype claimed the sub
# takes no arguments although it requires one.
sub wwwname {
    my ($name) = @_;                # Name of package

    return "<A HREF=\"http://bugs.debian.org/cgi-bin/pkgreport.cgi?archive=no&amp;pkg=" .
        urlsanit($name) . '">' . htmlsanit($name) . '</A>';
}
392
# check_worry($status)
#
# Decide from a bug's status text whether the bug is one to worry about.
# Returns 0 when
#   - the leading [...] group contains an "I",
#   - a later " [...]" group contains an "X", or
#   - a " [...]" group contains one of O, S, U, E while none contains a T;
# returns 1 in every other case.
sub check_worry {
    my ($status) = @_;

    return 0 if $status =~ m/^\[[^]]*I/;
    return 0 if $status =~ m/ \[[^]]*X/;

    my $in_other_dist = ($status =~ m/ \[[^]]*[OSUE]/);
    my $in_testing    = ($status =~ m/ \[[^]]*T/);
    return 0 if $in_other_dist and not $in_testing;

    return 1;
}
403
404 1;