fa5436e0a7
GitOrigin-RevId: e8057b67ebf307f01bdcc8fba94d94f75039d1f6
104 lines
2.3 KiB
Nix
104 lines
2.3 KiB
Nix
{
|
|
lib,
|
|
buildPythonPackage,
|
|
fetchFromGitHub,
|
|
# runtime dependencies
|
|
layoutparser,
|
|
python-multipart,
|
|
huggingface-hub,
|
|
opencv,
|
|
onnxruntime,
|
|
transformers,
|
|
detectron2,
|
|
paddleocr,
|
|
# check inputs
|
|
pytestCheckHook,
|
|
coverage,
|
|
click,
|
|
httpx,
|
|
mypy,
|
|
pytest-cov,
|
|
pdf2image,
|
|
}:
|
|
|
|
buildPythonPackage rec {
|
|
pname = "unstructured-inference";
|
|
version = "0.7.24";
|
|
format = "setuptools";
|
|
|
|
src = fetchFromGitHub {
|
|
owner = "Unstructured-IO";
|
|
repo = "unstructured-inference";
|
|
rev = "refs/tags/${version}";
|
|
hash = "sha256-AxQHTUgE4CyiinT7HEh6fvbw+uVi7lKUgfOc1KZOezU=";
|
|
};
|
|
|
|
postPatch = ''
|
|
substituteInPlace requirements/base.in \
|
|
--replace "opencv-python" "opencv"
|
|
'';
|
|
|
|
propagatedBuildInputs =
|
|
[
|
|
layoutparser
|
|
python-multipart
|
|
huggingface-hub
|
|
opencv
|
|
onnxruntime
|
|
transformers
|
|
detectron2
|
|
paddleocr
|
|
# yolox
|
|
]
|
|
++ layoutparser.optional-dependencies.layoutmodels ++ layoutparser.optional-dependencies.tesseract;
|
|
|
|
nativeCheckInputs = [
|
|
pytestCheckHook
|
|
coverage
|
|
click
|
|
httpx
|
|
mypy
|
|
pytest-cov
|
|
pdf2image
|
|
huggingface-hub
|
|
];
|
|
|
|
preCheck = ''
|
|
export HOME=$(mktemp -d)
|
|
'';
|
|
|
|
disabledTests = [
|
|
# not sure why this fails
|
|
"test_get_path_oob_move_deeply_nested"
|
|
"test_get_path_oob_move_nested[False]"
|
|
# requires yolox
|
|
"test_yolox"
|
|
];
|
|
|
|
disabledTestPaths = [
|
|
# network access
|
|
"test_unstructured_inference/inference/test_layout.py"
|
|
"test_unstructured_inference/models/test_chippermodel.py"
|
|
"test_unstructured_inference/models/test_detectron2.py"
|
|
"test_unstructured_inference/models/test_detectron2onnx.py"
|
|
# unclear failure
|
|
"test_unstructured_inference/models/test_donut.py"
|
|
"test_unstructured_inference/models/test_model.py"
|
|
"test_unstructured_inference/models/test_tables.py"
|
|
];
|
|
|
|
pythonImportsCheck = [ "unstructured_inference" ];
|
|
|
|
meta = with lib; {
|
|
description = "hosted model inference code for layout parsing models";
|
|
homepage = "https://github.com/Unstructured-IO/unstructured-inference";
|
|
changelog = "https://github.com/Unstructured-IO/unstructured-inference/blob/${src.rev}/CHANGELOG.md";
|
|
license = licenses.asl20;
|
|
maintainers = with maintainers; [ happysalada ];
|
|
platforms = [
|
|
"x86_64-linux"
|
|
"x86_64-darwin"
|
|
"aarch64-darwin"
|
|
];
|
|
};
|
|
}
|