2021-01-11 07:54:33 +00:00
|
|
|
# Package expression for grab-site, built as a Python application on top of
# a customised Python 3.7 package set.
#
# Arguments:
#   lib             - used for the `meta` attributes (licenses, maintainers, platforms)
#   stdenv          - not referenced in this expression; kept so the argument
#                     set stays unchanged for existing callers
#   python37        - base interpreter whose package set is overridden below
#   fetchFromGitHub - fetcher for the upstream source
{ lib, stdenv, python37, fetchFromGitHub }:

let
  # Python 3.7 package set in which `tornado` resolves to `tornado_4`.
  # NOTE(review): presumably one of the dependencies below needs the 4.x
  # series of tornado - confirm before dropping this override.
  python = python37.override {
    # Point the interpreter's `self` at the overridden interpreter so the
    # override is applied consistently throughout its package set.
    self = python;
    packageOverrides = self: super: {
      tornado = super.tornado_4;
    };
  };

in
with python.pkgs; buildPythonApplication rec {
  pname = "grab-site";
  version = "2.2.0";

  src = fetchFromGitHub {
    owner = "ArchiveTeam";
    repo = "grab-site";
    # The revision fetched is the one named exactly like `version`.
    rev = version;
    sha256 = "1jxcv9dral6h7vfpfqkp1yif6plj0vspzakymkj8hfl75nh0wpv8";
  };

  # setup.py requests wpull through a direct tarball URL; rewrite that
  # requirement to the bare name "wpull".
  # NOTE(review): presumably this lets `ludios_wpull` from
  # propagatedBuildInputs satisfy the requirement - confirm.
  postPatch = ''
    substituteInPlace setup.py \
      --replace '"wpull @ https://github.com/ArchiveTeam/ludios_wpull/tarball/master#egg=wpull-3.0.7"' '"wpull"'
  '';

  propagatedBuildInputs = [
    click
    ludios_wpull
    manhole
    lmdb
    autobahn
    fb-re2
    websockets
    cchardet
  ];

  # Run the upstream offline test script with $out/bin appended to PATH.
  # The pre/post hooks are invoked explicitly because overriding checkPhase
  # replaces the default implementation that would otherwise run them.
  checkPhase = ''
    runHook preCheck

    export PATH=$PATH:$out/bin
    bash ./tests/offline-tests

    runHook postCheck
  '';

  meta = with lib; {
    description = "Crawler for web archiving with WARC output";
    homepage = "https://github.com/ArchiveTeam/grab-site";
    license = licenses.mit;
    maintainers = with maintainers; [ ivan ];
    platforms = platforms.all;
  };
}
|