131 lines
3.4 KiB
Nix
131 lines
3.4 KiB
Nix
{
|
|
lib,
|
|
buildPythonPackage,
|
|
fetchFromGitHub,
|
|
|
|
fetchzip,
|
|
replaceVars,
|
|
|
|
setuptools,
|
|
pyclipper,
|
|
opencv-python,
|
|
numpy,
|
|
six,
|
|
shapely,
|
|
pyyaml,
|
|
pillow,
|
|
onnxruntime,
|
|
tqdm,
|
|
|
|
pytestCheckHook,
|
|
requests,
|
|
}:
|
|
let
|
|
version = "1.4.1";
|
|
|
|
src = fetchFromGitHub {
|
|
owner = "RapidAI";
|
|
repo = "RapidOCR";
|
|
tag = "v${version}";
|
|
hash = "sha256-6ohh4NSYqJ+i1JRdsKbcJZns07c+roVJ87r0lvBbExU=";
|
|
};
|
|
|
|
models =
|
|
fetchzip {
|
|
url = "https://github.com/RapidAI/RapidOCR/releases/download/v1.1.0/required_for_whl_v1.3.0.zip";
|
|
hash = "sha256-j/0nzyvu/HfNTt5EZ+2Phe5dkyPOdQw/OZTz0yS63aA=";
|
|
stripRoot = false;
|
|
}
|
|
+ "/required_for_whl_v1.3.0/resources/models";
|
|
in
|
|
buildPythonPackage {
|
|
pname = "rapidocr-onnxruntime";
|
|
inherit version src;
|
|
pyproject = true;
|
|
|
|
sourceRoot = "${src.name}/python";
|
|
|
|
# HACK:
|
|
# Upstream uses a very unconventional structure to organize the packages, and we have to coax the
|
|
# existing infrastructure to work with it.
|
|
# See https://github.com/RapidAI/RapidOCR/blob/02829ef986bc2a5c4f33e9c45c9267bcf2d07a1d/.github/workflows/gen_whl_to_pypi_rapidocr_ort.yml#L80-L92
|
|
# for the "intended" way of building this package.
|
|
|
|
# The setup.py supplied by upstream tries to determine the current version by
|
|
# fetching the latest version of the package from PyPI, and then bumping the version number.
|
|
# This is not allowed in the Nix build environment as we do not have internet access,
|
|
# hence we patch that out and get the version from the build environment directly.
|
|
patches = [
|
|
(replaceVars ./setup-py-override-version-checking.patch {
|
|
inherit version;
|
|
})
|
|
];
|
|
|
|
postPatch = ''
|
|
mv setup_onnxruntime.py setup.py
|
|
mkdir -p rapidocr_onnxruntime/models
|
|
|
|
ln -s ${models}/* rapidocr_onnxruntime/models
|
|
|
|
# Magic patch from upstream - what does this even do??
|
|
echo "from .rapidocr_onnxruntime.main import RapidOCR, VisRes" > __init__.py
|
|
'';
|
|
|
|
# Upstream expects the source files to be under rapidocr_onnxruntime/rapidocr_onnxruntime
|
|
# instead of rapidocr_onnxruntime for the wheel to build correctly.
|
|
preBuild = ''
|
|
mkdir rapidocr_onnxruntime_t
|
|
mv rapidocr_onnxruntime rapidocr_onnxruntime_t
|
|
mv rapidocr_onnxruntime_t rapidocr_onnxruntime
|
|
'';
|
|
|
|
# Revert the above hack
|
|
postBuild = ''
|
|
mv rapidocr_onnxruntime rapidocr_onnxruntime_t
|
|
mv rapidocr_onnxruntime_t/* .
|
|
'';
|
|
|
|
build-system = [ setuptools ];
|
|
|
|
dependencies = [
|
|
pyclipper
|
|
opencv-python
|
|
numpy
|
|
six
|
|
shapely
|
|
pyyaml
|
|
pillow
|
|
onnxruntime
|
|
tqdm
|
|
];
|
|
|
|
pythonImportsCheck = [ "rapidocr_onnxruntime" ];
|
|
|
|
nativeCheckInputs = [
|
|
pytestCheckHook
|
|
requests
|
|
];
|
|
|
|
# These are tests for different backends.
|
|
disabledTestPaths = [
|
|
"tests/test_vino.py"
|
|
"tests/test_paddle.py"
|
|
];
|
|
|
|
disabledTests = [
|
|
# Needs Internet access
|
|
"test_long_img"
|
|
];
|
|
|
|
meta = {
|
|
# This seems to be related to https://github.com/microsoft/onnxruntime/issues/10038
|
|
# Also some related issue: https://github.com/NixOS/nixpkgs/pull/319053#issuecomment-2167713362
|
|
badPlatforms = [ "aarch64-linux" ];
|
|
changelog = "https://github.com/RapidAI/RapidOCR/releases/tag/v${version}";
|
|
description = "Cross platform OCR Library based on OnnxRuntime";
|
|
homepage = "https://github.com/RapidAI/RapidOCR";
|
|
license = with lib.licenses; [ asl20 ];
|
|
maintainers = with lib.maintainers; [ pluiedev ];
|
|
mainProgram = "rapidocr_onnxruntime";
|
|
};
|
|
}
|