106 lines
2.3 KiB
Nix
106 lines
2.3 KiB
Nix
{
|
|
lib,
|
|
buildPythonPackage,
|
|
fetchFromGitHub,
|
|
|
|
# build-system
|
|
setuptools,
|
|
|
|
# dependencies
|
|
numpy,
|
|
scikit-learn,
|
|
termcolor,
|
|
tqdm,
|
|
pandas,
|
|
|
|
# tests
|
|
cleanvision,
|
|
datasets,
|
|
fasttext,
|
|
hypothesis,
|
|
keras,
|
|
matplotlib,
|
|
pytestCheckHook,
|
|
pytest-lazy-fixture,
|
|
skorch,
|
|
tensorflow,
|
|
torch,
|
|
torchvision,
|
|
wget,
|
|
pythonAtLeast,
|
|
}:
|
|
|
|
buildPythonPackage rec {
|
|
pname = "cleanlab";
|
|
version = "2.7.0";
|
|
pyproject = true;
|
|
|
|
src = fetchFromGitHub {
|
|
owner = "cleanlab";
|
|
repo = "cleanlab";
|
|
rev = "refs/tags/v${version}";
|
|
hash = "sha256-0kCEIHNOXIkdwDH5zCVWnR/W79ppc/1PFsJ/a4goGzk=";
|
|
};
|
|
|
|
build-system = [ setuptools ];
|
|
|
|
dependencies = [
|
|
numpy
|
|
scikit-learn
|
|
termcolor
|
|
tqdm
|
|
pandas
|
|
];
|
|
|
|
# This is ONLY turned off when we have testing enabled.
|
|
# The reason we do this is because of duplicate packages in the enclosure
|
|
# when using the packages in nativeCheckInputs.
|
|
# Affected packages: grpcio protobuf tensorboard tensorboard-plugin-profile
|
|
catchConflicts = (!doCheck);
|
|
doCheck = true;
|
|
|
|
nativeCheckInputs = [
|
|
cleanvision
|
|
datasets
|
|
fasttext
|
|
hypothesis
|
|
keras
|
|
matplotlib
|
|
pytestCheckHook
|
|
pytest-lazy-fixture
|
|
skorch
|
|
tensorflow
|
|
torch
|
|
torchvision
|
|
wget
|
|
];
|
|
|
|
disabledTests =
|
|
[
|
|
# Requires the datasets we prevent from downloading
|
|
"test_create_imagelab"
|
|
]
|
|
++ lib.optionals (pythonAtLeast "3.12") [
|
|
# AttributeError: 'called_once_with' is not a valid assertion.
|
|
# Use a spec for the mock if 'called_once_with' is meant to be an attribute..
|
|
# Did you mean: 'assert_called_once_with'?
|
|
"test_custom_issue_manager_not_registered"
|
|
];
|
|
|
|
disabledTestPaths = [
|
|
# Requires internet
|
|
"tests/test_dataset.py"
|
|
# Requires the datasets we just prevented from downloading
|
|
"tests/datalab/test_cleanvision_integration.py"
|
|
# Fails because of issues with the keras derivation
|
|
"tests/test_frameworks.py"
|
|
];
|
|
|
|
meta = {
|
|
description = "Standard data-centric AI package for data quality and machine learning with messy, real-world data and labels";
|
|
homepage = "https://github.com/cleanlab/cleanlab";
|
|
changelog = "https://github.com/cleanlab/cleanlab/releases/tag/v${version}";
|
|
license = lib.licenses.agpl3Only;
|
|
maintainers = with lib.maintainers; [ happysalada ];
|
|
};
|
|
}
|