587713944a
GitOrigin-RevId: 6143fc5eeb9c4f00163267708e26191d1e918932
71 lines
1.2 KiB
Nix
71 lines
1.2 KiB
Nix
# Package definition for the `extruct` Python library, built from the
# scrapinghub/extruct GitHub repository at the tag matching `version`.
#
# All arguments are supplied by the caller (typically via callPackage).
{ lib
, buildPythonPackage
, fetchFromGitHub
, html-text
, jstyleson
, lxml
, mf2py
, mock
, pyrdfa3
, pytestCheckHook
, pythonOlder
  # NOTE(review): accepted but not referenced anywhere in this expression;
  # kept so existing `.override` callers that pass it keep working.
, pythonRelaxDepsHook
, rdflib
, setuptools
, six
, w3lib
}:

buildPythonPackage rec {
  pname = "extruct";
  version = "0.16.0";
  pyproject = true;

  # Not built for Python interpreters older than 3.8.
  disabled = pythonOlder "3.8";

  src = fetchFromGitHub {
    owner = "scrapinghub";
    repo = "extruct";
    # Fully qualified tag ref derived from `version` above.
    rev = "refs/tags/v${version}";
    hash = "sha256-6lAb17EoR0FKyIOb9hk1jcpmPtZ7vClfuCrDZ83XBeg=";
  };

  # Build-time only tooling.
  nativeBuildInputs = [
    setuptools
  ];

  # Runtime dependencies propagated to consumers of this package.
  propagatedBuildInputs = [
    html-text
    jstyleson
    lxml
    mf2py
    pyrdfa3
    rdflib
    six
    w3lib
  ];

  # Dependencies needed only while running the test suite.
  nativeCheckInputs = [
    mock
    pytestCheckHook
  ];

  # Smoke check: the top-level module must be importable after the build.
  pythonImportsCheck = [
    "extruct"
  ];

  disabledTests = [
    # AssertionError: Lists differ
    "test_microformat"
    "test_umicroformat"
  ];

  meta = {
    description = "Extract embedded metadata from HTML markup";
    mainProgram = "extruct";
    homepage = "https://github.com/scrapinghub/extruct";
    changelog = "https://github.com/scrapinghub/extruct/blob/v${version}/HISTORY.rst";
    license = lib.licenses.bsd3;
    maintainers = [ lib.maintainers.ambroisie ];
  };
}