# Nix expression that builds grab-site as a Python application from the
# ArchiveTeam/grab-site GitHub repository.
#
# Arguments:
#   stdenv          - used here only for `stdenv.lib` (licenses, maintainers,
#                     platforms) in `meta`.
#   python37        - Python interpreter whose package set is overridden below.
#   fetchFromGitHub - fetcher used to obtain the source at the tagged version.
{ stdenv, python37, fetchFromGitHub }:

let
  # Python 3.7 with a package set in which `tornado` resolves to `tornado_4`.
  # NOTE(review): presumably one of the dependencies listed below requires
  # tornado 4 -- confirm which one before dropping this override.
  python = python37.override {
    # Hand the overridden interpreter back in as `self`.
    # NOTE(review): presumably so that `python.pkgs` refers to the overridden
    # package set rather than the stock one -- confirm against nixpkgs docs.
    self = python;
    packageOverrides = self: super: {
      tornado = super.tornado_4;
    };
  };

in with python.pkgs; buildPythonApplication rec {
  version = "2.1.19";
  name = "grab-site-${version}";

  # The upstream tag name is the bare version string, so `rev` reuses it.
  src = fetchFromGitHub {
    rev = version;
    owner = "ArchiveTeam";
    repo = "grab-site";
    sha256 = "1v1hnhv5knzdl0kj3574ccwlh171vcb7faddp095ycdmiiybalk4";
  };

  # All of these names are resolved from the overridden `python.pkgs` via the
  # enclosing `with`.
  propagatedBuildInputs = [
    click ludios_wpull manhole lmdb autobahn fb-re2 websockets cchardet
  ];

  # Append the output's bin directory to PATH, then run the repository's
  # offline test script with bash.
  # NOTE(review): presumably the script invokes the installed executables by
  # name, which is why $out/bin must be on PATH -- confirm.
  checkPhase = ''
    export PATH=$PATH:$out/bin
    bash ./tests/offline-tests
  '';

  meta = with stdenv.lib; {
    description = "Crawler for web archiving with WARC output";
    homepage = "https://github.com/ArchiveTeam/grab-site";
    license = licenses.mit;
    maintainers = with maintainers; [ ivan ];
    platforms = platforms.all;
  };
}