From 77e7b3548eda07722ba4a123603148ce4edf7091 Mon Sep 17 00:00:00 2001 From: Alexander Foremny Date: Fri, 22 Dec 2023 07:11:54 +0100 Subject: fix: fix tesseract call --- app/Main.hs | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/app/Main.hs b/app/Main.hs index 8803f8b..05b066e 100644 --- a/app/Main.hs +++ b/app/Main.hs @@ -458,7 +458,8 @@ ocr input = ocr1 :: FilePath -> FilePath -> IO T.Text ocr1 tmp input = T.decodeUtf8 . LB.toStrict - <$> sh (printf "tesseract '%s' -" (tmp input)) + -- XXX `--oem 1` seems to be unavailable + <$> sh (printf "tesseract '%s' - -l deu+eng --oem 3 --psm 1" (tmp input)) data Index = Index { originalText :: T.Text, -- cgit v1.2.3