# Package definition for `unstructured-inference`, built from the upstream
# GitHub tag with setuptools.
{
  lib,
  buildPythonPackage,
  fetchFromGitHub,
  # runtime dependencies
  layoutparser,
  python-multipart,
  huggingface-hub,
  opencv,
  onnxruntime,
  transformers,
  detectron2,
  # check inputs
  pytestCheckHook,
  coverage,
  click,
  httpx,
  mypy,
  pytest-cov,
  pdf2image,
}:

buildPythonPackage rec {
  pname = "unstructured-inference";
  version = "0.5.7";
  format = "setuptools";

  src = fetchFromGitHub {
    owner = "Unstructured-IO";
    repo = "unstructured-inference";
    rev = "refs/tags/${version}";
    hash = "sha256-xlsihi1ZTNgdnSk3H8rMBRi4AAxPKNFqygcIMtM/jE0=";
  };

  # Rename the upstream `opencv-python` requirement to `opencv`, the name of
  # the package supplied through the function arguments.
  postPatch = ''
    substituteInPlace requirements/base.in \
      --replace "opencv-python" "opencv"
  '';

  propagatedBuildInputs =
    [
      layoutparser
      python-multipart
      huggingface-hub
      opencv
      onnxruntime
      transformers
      detectron2
      # paddleocr
      # yolox
    ]
    ++ layoutparser.optional-dependencies.layoutmodels
    ++ layoutparser.optional-dependencies.tesseract;

  # huggingface-hub is not repeated here: it is already listed in
  # propagatedBuildInputs above.
  nativeCheckInputs = [
    pytestCheckHook
    coverage
    click
    httpx
    mypy
    pytest-cov
    pdf2image
  ];

  # Point HOME at a fresh temporary directory for the test run.
  # NOTE(review): presumably the tests or their dependencies write under
  # $HOME, which is not writable in the build sandbox - confirm.
  preCheck = ''
    export HOME=$(mktemp -d)
  '';

  disabledTests = [
    # not sure why this fails
    "test_get_path_oob_move_deeply_nested"
    "test_get_path_oob_move_nested[False]"
    # requires yolox
    "test_yolox"
    # requires paddleocr
    "test_table_prediction"
  ];

  disabledTestPaths = [
    # network access
    "test_unstructured_inference/inference/test_layout.py"
    "test_unstructured_inference/models/test_chippermodel.py"
    "test_unstructured_inference/models/test_detectron2.py"
    "test_unstructured_inference/models/test_detectron2onnx.py"
    # unclear failure
    "test_unstructured_inference/models/test_donut.py"
    "test_unstructured_inference/models/test_model.py"
    "test_unstructured_inference/models/test_tables.py"
  ];

  pythonImportsCheck = [ "unstructured_inference" ];

  # `lib` is referenced explicitly instead of `with lib;` so that only the
  # maintainer list is resolved through a `with` scope.
  meta = {
    description = "Hosted model inference code for layout parsing models";
    homepage = "https://github.com/Unstructured-IO/unstructured-inference";
    changelog = "https://github.com/Unstructured-IO/unstructured-inference/blob/${src.rev}/CHANGELOG.md";
    license = lib.licenses.asl20;
    maintainers = with lib.maintainers; [ happysalada ];
  };
}