forked from mirrors/nixpkgs
60 lines
1.5 KiB
Nix
60 lines
1.5 KiB
Nix
{ stdenv, fetchFromGitHub, fetchurl, pythonPackages, curl }:
|
|
|
|
let
|
|
getmodel = name: sha256: {
|
|
inherit name;
|
|
src = fetchurl {
|
|
url = "http://www.tmbdev.net/ocropy/${name}";
|
|
inherit sha256;
|
|
};
|
|
};
|
|
|
|
models = [
|
|
(getmodel "en-default.pyrnn.gz"
|
|
"1xyi3k3p81mfw0491gb1haisazfyi2i18f1wjs1m34ak39qfqjdp")
|
|
(getmodel "fraktur.pyrnn.gz"
|
|
"1wlwvxn91ilgmlri1hj81arl3mbzxc24ycdnkf5icq4hdi4c6y8b")
|
|
];
|
|
|
|
in
|
|
pythonPackages.buildPythonApplication rec {
|
|
pname = "ocropus";
|
|
version = "1.3.3";
|
|
|
|
src = fetchFromGitHub {
|
|
sha256 = "02p1334mic5cfhvpfphfrbim4036yfd8s2zzpwm0xmm829z71nr7";
|
|
rev = "v${version}";
|
|
repo = "ocropy";
|
|
owner = "tmbdev";
|
|
};
|
|
|
|
propagatedBuildInputs = with pythonPackages; [ curl numpy scipy pillow
|
|
matplotlib beautifulsoup4 pygtk lxml ];
|
|
|
|
enableParallelBuilding = true;
|
|
|
|
preConfigure = with stdenv.lib; ''
|
|
${concatStrings (map (x: "cp -R ${x.src} models/`basename ${x.name}`;")
|
|
models)}
|
|
|
|
substituteInPlace ocrolib/common.py --replace /usr/local $out
|
|
substituteInPlace ocrolib/default.py --replace /usr/local $out
|
|
'';
|
|
|
|
doCheck = false; # fails
|
|
checkPhase = ''
|
|
patchShebangs .
|
|
substituteInPlace ./run-test \
|
|
--replace 'ocropus-rpred' 'ocropus-rpred -Q $NIX_BUILD_CORES'
|
|
PATH=".:$PATH" ./run-test
|
|
'';
|
|
|
|
meta = with stdenv.lib; {
|
|
description = "Open source document analysis and OCR system";
|
|
license = licenses.asl20;
|
|
homepage = "https://github.com/tmbdev/ocropy/";
|
|
maintainers = with maintainers; [ domenkozar ];
|
|
platforms = platforms.linux;
|
|
};
|
|
}
|