Author: viric
Date: Sun Apr 24 20:01:19 2011
New Revision: 26956
URL: https://svn.nixos.org/websvn/nix/?rev=26956&sc=1
Log:
Adding training results files for some languages to tesseract to be able to do OCR directly.

Modified:
   nixpkgs/trunk/pkgs/applications/graphics/tesseract/default.nix

Modified: nixpkgs/trunk/pkgs/applications/graphics/tesseract/default.nix
==============================================================================
--- nixpkgs/trunk/pkgs/applications/graphics/tesseract/default.nix Sun Apr 24 19:44:36 2011 (r26955)
+++ nixpkgs/trunk/pkgs/applications/graphics/tesseract/default.nix Sun Apr 24 20:01:19 2011 (r26956)
@@ -1,5 +1,22 @@
 { stdenv, fetchurl, libtiff }:
 
+let
+  f = lang : sha256 : let
+      src = fetchurl {
+        url = "http://tesseract-ocr.googlecode.com/files/${lang}.traineddata.gz";
+        inherit sha256;
+      };
+    in
+      "gunzip -c ${src} > $out/share/tessdata/${lang}.traineddata";
+
+  extraLanguages = ''
+    ${f "cat" "1qndk8qygw9bq7nzn7kzgxkm3jhlq7jgvdqpj5id4rrcaavjvifw"}
+    ${f "rus" "0yjzks189bgcmi2vr4v0l0fla11qdrw3cb1nvpxl9mdis8qr9vcc"}
+    ${f "spa" "1q1hw3qi95q5ww3l02fbhjqacxm34cp65fkbx10wjdcg0s5p9q2x"}
+    ${f "nld" "0cbqfhl2rwb1mg4y1140nw2vhhcilc0nk7bfbnxw6bzj1y5n49i8"}
+  '';
+in
+
 stdenv.mkDerivation {
   name = "tesseract-3.0.0";
 
@@ -10,6 +27,8 @@
 
   buildInputs = [ libtiff ];
 
+  postInstall = extraLanguages;
+
   meta = {
     description = "OCR engine";
     homepage = http://code.google.com/p/tesseract-ocr/;
_______________________________________________
nix-commits mailing list
nix-comm...@cs.uu.nl
http://mail.cs.uu.nl/mailman/listinfo/nix-commits