2023-07-15 17:15:38 +00:00
# Python package expression for snorkel, built from the tagged GitHub source
# of snorkel-team/snorkel with buildPythonPackage.
{
  lib,
  buildPythonPackage,
  fetchFromGitHub,
  pythonOlder,
  tensorboard,
  scipy,
  tqdm,
  scikit-learn,
  munkres,
  networkx,
  torch,
  pandas,
  # test dependencies
  pytestCheckHook,
  spacy,
  pyspark,
  dill,
  dask,
  spacy_models,
}:

let
  # Bound outside the attribute set so that `src.repo` can reuse `pname`
  # and both values are passed on through `inherit`.
  pname = "snorkel";
  version = "0.10.0";
in
buildPythonPackage {
  inherit pname version;
  format = "setuptools";

  disabled = pythonOlder "3.8";

  src = fetchFromGitHub {
    owner = "snorkel-team";
    repo = pname;
    rev = "refs/tags/v${version}";
    hash = "sha256-1DgkMHYToiI3266yCND1bXiui80x8AaBttxM83kJImw=";
  };

  propagatedBuildInputs = [
    tensorboard
    scipy
    tqdm
    scikit-learn
    munkres
    networkx
    torch
    pandas
  ];

  # Tests fail because of some wrong path references, e.g.:
  #   No such file or directory: '/nix/store/8r9x7xv9nfwmd36ca28a39xaharcjdzj-python3.10-pyspark-3.4.0/lib/python3.10/site-packages/pyspark/./bin/spark-submit'
  doCheck = false;

  # Test inputs are still declared even though the check phase is disabled
  # above (presumably so the suite can be re-enabled once the pyspark path
  # problem is resolved).
  nativeCheckInputs = [
    pytestCheckHook
    spacy
    pyspark
    dill
    dask
    spacy_models.en_core_web_sm
  ] ++ dask.optional-dependencies.distributed;

  meta = {
    description = "A system for quickly generating training data with weak supervision";
    homepage = "https://github.com/snorkel-team/snorkel";
    # Uses the same owner/repo as `src` and `homepage`; the previous URL
    # pointed at github.com/snorkel/snorkel.
    changelog = "https://github.com/snorkel-team/snorkel/releases/tag/v${version}";
    license = lib.licenses.asl20;
    maintainers = with lib.maintainers; [ happysalada ];
  };
}