| my($file) = @_; | my($file) = @_; | ||||
| my $txt = ''; | my $txt = ''; | ||||
| open(OCR,"tesseract -l eng+deu+fra+ita %s - |", $file)); | |||||
| open(OCR,sprintf("tesseract -l eng+deu+fra+ita %s - |", $file)); | |||||
| while(<OCR>) { | while(<OCR>) { | ||||
| $txt .= $_; | $txt .= $_; | ||||
| } | } | ||||
| close(OCR); | close(OCR); | ||||
| return $txt; | return $txt; | ||||
| } | } | ||||
| sub create_page_words { | sub create_page_words { |