diff options
Diffstat (limited to 'pkgs/applications/graphics/tesseract/default.nix')
-rw-r--r-- | pkgs/applications/graphics/tesseract/default.nix | 39 |
1 files changed, 39 insertions, 0 deletions
# pkgs/applications/graphics/tesseract/default.nix
#
# Tesseract OCR engine built from the upstream 3.00 source tarball, with a
# handful of additional trained-language data files unpacked into the output.
#
# Arguments:
#   stdenv   - standard build environment (provides mkDerivation and lib)
#   fetchurl - fixed-output fetcher used for the tarball and language data
#   libtiff  - the only build input declared for this package
{ stdenv, fetchurl, libtiff }:

let
  # Extra language packs to install. `lang` is the code used in the upstream
  # file name (<lang>.traineddata.gz); `sha256` is the hash of that download.
  languages = [
    { lang = "cat"; sha256 = "1qndk8qygw9bq7nzn7kzgxkm3jhlq7jgvdqpj5id4rrcaavjvifw"; }
    { lang = "rus"; sha256 = "0yjzks189bgcmi2vr4v0l0fla11qdrw3cb1nvpxl9mdis8qr9vcc"; }
    { lang = "spa"; sha256 = "1q1hw3qi95q5ww3l02fbhjqacxm34cp65fkbx10wjdcg0s5p9q2x"; }
    { lang = "nld"; sha256 = "0cbqfhl2rwb1mg4y1140nw2vhhcilc0nk7bfbnxw6bzj1y5n49i8"; }
  ];

  # Returns one line of shell that decompresses the fetched trained data for
  # a single language into $out/share/tessdata/<lang>.traineddata.
  installLanguage = { lang, sha256 }:
    let
      src = fetchurl {
        url = "http://tesseract-ocr.googlecode.com/files/${lang}.traineddata.gz";
        inherit sha256;
      };
    in ''
      gunzip -c ${src} > "$out/share/tessdata/${lang}.traineddata"
    '';

  # Shell fragment run after the install phase. The directory is created
  # explicitly so the redirections below do not depend on the upstream
  # install step having already created it.
  extraLanguages = ''
    mkdir -p "$out/share/tessdata"
  '' + stdenv.lib.concatMapStrings installLanguage languages;
in

stdenv.mkDerivation {
  # NOTE(review): the package name says 3.0.0 while the upstream tarball is
  # named 3.00; kept as-is so the existing package name does not change.
  name = "tesseract-3.0.0";

  src = fetchurl {
    # Quoted string instead of a bare URL literal (deprecated Nix syntax).
    url = "http://tesseract-ocr.googlecode.com/files/tesseract-3.00.tar.gz";
    sha256 = "111r9hy1rcs2ch4kdi9dkzwch3xg38vv379sf3cjpkswkigx8clw";
  };

  buildInputs = [ libtiff ];

  # Unpack the additional language data once the main install has finished.
  postInstall = extraLanguages;

  meta = {
    description = "OCR engine";
    homepage = "http://code.google.com/p/tesseract-ocr/";
    license = "Apache2.0";
    maintainers = with stdenv.lib.maintainers; [ viric ];
    platforms = with stdenv.lib.platforms; linux;
  };
}