# Per-input conversion loop: for every path given on the command line, build
# a DjVu file with cjb2, OCR the same image with tesseract, wrap the result
# in a "(page ...)" text file, and load that file into the DjVu with djvused.
#
# NOTE(review): this excerpt appears to be a patch hunk. Lines starting with
# "- " look like the old version of a statement and the "+ " line(s) after
# them the replacement; unmarked lines are unchanged context.
# NOTE(review): none of the system() return values are checked, so a failed
# cjb2/tesseract/djvused run goes unnoticed here.
# NOTE(review): IO::File must be loaded and @djvu_files declared outside the
# lines visible here -- confirm.
for my $tiff (@ARGV) {
# Base name = input path with its last ".ext" suffix removed.
my $base_name = $tiff;
$base_name =~ s/\.[^\.]+$//;
# Change: cjb2 is now given the original input path ($tiff) instead of the
# extension-less base name.
- system('cjb2',$base_name,$base_name.'.djvu');
+ system('cjb2',$tiff,$base_name.'.djvu');
# tesseract is called with "<base>.ocr" as its output base.
system('tesseract',$tiff,$base_name.'.ocr');
# Change: the OCR result is now read from "<base>.ocr.txt" rather than
# "<base>.ocr" -- presumably because tesseract appends ".txt" to the output
# base; verify against the installed tesseract.
- my $fh = IO::File->new($base_name.'.ocr','r');
+ my $fh = IO::File->new($base_name.'.ocr.txt','r');
# NOTE(review): $wf is used below without checking that the open succeeded.
my $wf = IO::File->new($base_name.'.txt','w');
# Opening of the page wrapper; presumably the djvused hidden-text
# s-expression format -- TODO confirm the meaning of "0 0 1 1".
print {$wf} "(page 0 0 1 1\n";
if (defined $fh) {
# NOTE(review): this body is empty in the lines shown, so no OCR text is
# copied between the "(page" header and the closing ")". It may have been
# elided from this excerpt -- confirm against the full script. $fh is also
# never explicitly closed in the visible code.
}
print {$wf} ")\n";
close $wf;
# Change: cleanup now targets "<base>.ocr.txt", and the misspelled command
# name 'dvjused' is corrected to 'djvused'.
# NOTE(review): $base_name is concatenated into the djvused -e command
# string, so a file name containing spaces or quote characters will likely
# break the set-txt command -- confirm djvused quoting rules.
- unlink($base_name.'.ocr') if -e $base_name.'.ocr';
- system('dvjused',$base_name.'.djvu','-e','select 1; remove-txt','-s');
- system('dvjused',$base_name.'.djvu','-e','select 1; set-txt '.$base_name.'.txt','-s');
+ unlink($base_name.'.ocr.txt') if -e $base_name.'.ocr.txt';
+ system('djvused',$base_name.'.djvu','-e','select 1; remove-txt','-s');
+ system('djvused',$base_name.'.djvu','-e','select 1; set-txt '.$base_name.'.txt','-s');
# Remove the temporary text file and record the produced DjVu path.
unlink($base_name.'.txt') if -e $base_name.'.txt';
push @djvu_files,$base_name.'.djvu';
}