2018-12-14 02:20:17 +00:00
|
|
|
# Package expression for grab-site ("Crawler for web archiving with WARC
# output"), built as a Python application from the ArchiveTeam/grab-site
# GitHub repository.
#
# Arguments:
#   stdenv           - used here only for `stdenv.lib` (licenses, maintainers,
#                      platforms) in `meta`.
#   python3Packages  - supplies `buildPythonApplication` and the Python
#                      dependencies listed in `propagatedBuildInputs`.
#   fetchFromGitHub  - fetches the source tree for the pinned release.
{ stdenv, python3Packages, fetchFromGitHub }:

python3Packages.buildPythonApplication rec {
  # `pname` + `version` replace a hand-assembled `name`; the resulting
  # derivation name is still "grab-site-<version>".
  pname = "grab-site";
  version = "2.1.19";

  src = fetchFromGitHub {
    owner = "ArchiveTeam";
    repo = "grab-site";
    # The revision fetched is the version string itself, so bumping `version`
    # also requires updating `sha256`.
    rev = version;
    sha256 = "1v1hnhv5knzdl0kj3574ccwlh171vcb7faddp095ycdmiiybalk4";
  };

  propagatedBuildInputs = with python3Packages; [
    click
    ludios_wpull
    manhole
    lmdb
    autobahn
    fb-re2
    websockets
    cchardet
  ];

  checkPhase = ''
    runHook preCheck

    # Append the install output's bin directory to PATH before running the
    # offline test script (presumably the script invokes the installed
    # executables by name -- confirm against tests/offline-tests upstream).
    export PATH="$PATH:$out/bin"
    bash ./tests/offline-tests

    runHook postCheck
  '';

  meta = with stdenv.lib; {
    description = "Crawler for web archiving with WARC output";
    homepage = "https://github.com/ArchiveTeam/grab-site";
    license = licenses.mit;
    maintainers = with maintainers; [ ivan ];
    platforms = platforms.all;
  };
}
|