Author: viric
Date: Sun Apr 24 20:01:19 2011
New Revision: 26956
URL: https://svn.nixos.org/websvn/nix/?rev=26956&sc=1
Log:
Adding trained-data files (.traineddata) for some languages (cat, rus, spa,
nld) to tesseract, so that it can do OCR in those languages directly.
Modified:
nixpkgs/trunk/pkgs/applications/graphics/tesseract/default.nix
Modified: nixpkgs/trunk/pkgs/applications/graphics/tesseract/default.nix
==============================================================================
--- nixpkgs/trunk/pkgs/applications/graphics/tesseract/default.nix Sun Apr 24 19:44:36 2011 (r26955)
+++ nixpkgs/trunk/pkgs/applications/graphics/tesseract/default.nix Sun Apr 24 20:01:19 2011 (r26956)
@@ -1,5 +1,22 @@
{ stdenv, fetchurl, libtiff }:
+let
+ f = lang : sha256 : let
+ src = fetchurl {
+ url = "http://tesseract-ocr.googlecode.com/files/${lang}.traineddata.gz";
+ inherit sha256;
+ };
+ in
+ "gunzip -c ${src} > $out/share/tessdata/${lang}.traineddata";
+
+ extraLanguages = ''
+ ${f "cat" "1qndk8qygw9bq7nzn7kzgxkm3jhlq7jgvdqpj5id4rrcaavjvifw"}
+ ${f "rus" "0yjzks189bgcmi2vr4v0l0fla11qdrw3cb1nvpxl9mdis8qr9vcc"}
+ ${f "spa" "1q1hw3qi95q5ww3l02fbhjqacxm34cp65fkbx10wjdcg0s5p9q2x"}
+ ${f "nld" "0cbqfhl2rwb1mg4y1140nw2vhhcilc0nk7bfbnxw6bzj1y5n49i8"}
+ '';
+in
+
stdenv.mkDerivation {
name = "tesseract-3.0.0";
@@ -10,6 +27,8 @@
buildInputs = [ libtiff ];
+ postInstall = extraLanguages;
+
meta = {
description = "OCR engine";
homepage = http://code.google.com/p/tesseract-ocr/;
_______________________________________________
nix-commits mailing list
[email protected]
http://mail.cs.uu.nl/mailman/listinfo/nix-commits