git.donarmstrong.com Git - bin.git/commitdiff
the output file for tesseract is ocr.txt
author Don Armstrong <don@donarmstrong.com>
Sat, 13 Sep 2014 19:49:26 +0000 (12:49 -0700)
committer Don Armstrong <don@donarmstrong.com>
Sat, 13 Sep 2014 19:49:26 +0000 (12:49 -0700)
make_djvu

index 1a470a5a21a250963759c29625ef3d4b7e8740a5..74fe74e2723bedb02c2218af20c0d2aa5be1c973 100755 (executable)
--- a/make_djvu
+++ b/make_djvu
@@ -85,7 +85,7 @@ for my $tiff (@ARGV) {
     $base_name =~ s/\.[^\.]+$//;
     system('cjb2',$tiff,$base_name.'.djvu');
     system('tesseract',$tiff,$base_name.'.ocr');
-    my $fh = IO::File->new($base_name.'.ocr','r');
+    my $fh = IO::File->new($base_name.'.ocr.txt','r');
     my $wf = IO::File->new($base_name.'.txt','w');
     print {$wf} "(page 0 0 1 1\n";
     if (defined $fh) {
@@ -98,7 +98,7 @@ for my $tiff (@ARGV) {
     }
     print {$wf} ")\n";
     close $wf;
-    unlink($base_name.'.ocr') if -e $base_name.'.ocr';
+    unlink($base_name.'.ocr.txt') if -e $base_name.'.ocr.txt';
     system('djvused',$base_name.'.djvu','-e','select 1; remove-txt','-s');
     system('djvused',$base_name.'.djvu','-e','select 1; set-txt '.$base_name.'.txt','-s');
     unlink($base_name.'.txt') if -e $base_name.'.txt';