From: Don Armstrong
Date: Sat, 13 Sep 2014 19:49:26 +0000 (-0700)
Subject: the output file for tesseract is ocr.txt
X-Git-Url: https://git.donarmstrong.com/?a=commitdiff_plain;h=6ff59b0e5cc6867c77175d1411d7eaa299af38a4;p=bin.git

the output file for tesseract is ocr.txt
---

diff --git a/make_djvu b/make_djvu
index 1a470a5..74fe74e 100755
--- a/make_djvu
+++ b/make_djvu
@@ -85,7 +85,7 @@ for my $tiff (@ARGV) {
     $base_name =~ s/\.[^\.]+$//;
     system('cjb2',$tiff,$base_name.'.djvu');
     system('tesseract',$tiff,$base_name.'.ocr');
-    my $fh = IO::File->new($base_name.'.ocr','r');
+    my $fh = IO::File->new($base_name.'.ocr.txt','r');
     my $wf = IO::File->new($base_name.'.txt','w');
     print {$wf} "(page 0 0 1 1\n";
     if (defined $fh) {
@@ -98,7 +98,7 @@ for my $tiff (@ARGV) {
     }
     print {$wf} ")\n";
     close $wf;
-    unlink($base_name.'.ocr') if -e $base_name.'.ocr';
+    unlink($base_name.'.ocr.txt') if -e $base_name.'.ocr.txt';
     system('djvused',$base_name.'.djvu','-e','select 1; remove-txt','-s');
     system('djvused',$base_name.'.djvu','-e','select 1; set-txt '.$base_name.'.txt','-s');
     unlink($base_name.'.txt') if -e $base_name.'.txt';