2024-06-05 15:53:02 +00:00
|
|
|
{
  lib,
  buildPythonPackage,
  fetchFromGitHub,
  html-text,
  jstyleson,
  lxml,
  mf2py,
  mock,
  pyrdfa3,
  pytestCheckHook,
  pythonOlder,
  rdflib,
  setuptools,
  six,
  w3lib,
}:

# Python package definition for extruct, built from the tagged GitHub source
# with a pyproject-based build.
buildPythonPackage rec {
  pname = "extruct";
  version = "0.17.0";
  pyproject = true;

  # Not built for Python interpreters older than 3.8.
  disabled = pythonOlder "3.8";

  src = fetchFromGitHub {
    owner = "scrapinghub";
    repo = "extruct";
    # Pin to the release tag matching `version`.
    rev = "refs/tags/v${version}";
    hash = "sha256-CfhIqbhrZkJ232grhHxrmj4H1/Bq33ZXe8kovSOWSK0=";
  };

  # Build backend; `build-system` is the pyproject-era replacement for
  # listing Python build tools in `nativeBuildInputs`.
  build-system = [ setuptools ];

  # Python dependencies propagated to consumers; `dependencies` is the
  # pyproject-era replacement for `propagatedBuildInputs`.
  dependencies = [
    html-text
    jstyleson
    lxml
    mf2py
    pyrdfa3
    rdflib
    six
    w3lib
  ];

  # Only needed while running the test suite.
  nativeCheckInputs = [
    mock
    pytestCheckHook
  ];

  # Smoke test: the top-level module must be importable after installation.
  pythonImportsCheck = [ "extruct" ];

  disabledTests = [
    # AssertionError: Lists differ
    "test_microformat"
    "test_umicroformat"
  ];

  # `lib` is referenced explicitly instead of `with lib;` so that no
  # unrelated names leak into the scope of the meta attribute set.
  meta = {
    description = "Extract embedded metadata from HTML markup";
    mainProgram = "extruct";
    homepage = "https://github.com/scrapinghub/extruct";
    changelog = "https://github.com/scrapinghub/extruct/blob/v${version}/HISTORY.rst";
    license = lib.licenses.bsd3;
    maintainers = with lib.maintainers; [ ambroisie ];
  };
}
|