81 lines
1.3 KiB
Nix
81 lines
1.3 KiB
Nix
{
|
|
lib,
|
|
buildPythonPackage,
|
|
fetchFromGitHub,
|
|
cmake,
|
|
pkg-config,
|
|
cxxopts,
|
|
poetry-core,
|
|
pybind11,
|
|
tabulate,
|
|
zlib,
|
|
nlohmann_json,
|
|
utf8cpp,
|
|
libjpeg,
|
|
qpdf,
|
|
loguru-cpp,
|
|
pytestCheckHook,
|
|
}:
|
|
|
|
buildPythonPackage rec {
|
|
pname = "docling-parse";
|
|
version = "2.0.3";
|
|
pyproject = true;
|
|
|
|
src = fetchFromGitHub {
|
|
owner = "DS4SD";
|
|
repo = "docling-parse";
|
|
rev = "refs/tags/v${version}";
|
|
hash = "sha256-pZJ7lneg4ftAoWS5AOflkkKCwZGF4TJIuqDjq4W4VBw=";
|
|
};
|
|
|
|
dontUseCmakeConfigure = true;
|
|
|
|
nativeBuildInputs = [
|
|
cmake
|
|
pkg-config
|
|
];
|
|
|
|
build-system = [
|
|
poetry-core
|
|
];
|
|
|
|
env.NIX_CFLAGS_COMPILE = "-I${lib.getDev utf8cpp}/include/utf8cpp";
|
|
|
|
buildInputs = [
|
|
pybind11
|
|
cxxopts
|
|
libjpeg
|
|
loguru-cpp
|
|
nlohmann_json
|
|
qpdf
|
|
utf8cpp
|
|
zlib
|
|
];
|
|
|
|
env.USE_SYSTEM_DEPS = true;
|
|
|
|
cmakeFlags = [
|
|
"-DUSE_SYSTEM_DEPS=True"
|
|
];
|
|
|
|
dependencies = [
|
|
tabulate
|
|
];
|
|
|
|
pythonImportsCheck = [
|
|
"docling_parse"
|
|
];
|
|
|
|
nativeCheckInputs = [
|
|
pytestCheckHook
|
|
];
|
|
|
|
meta = {
|
|
changelog = "https://github.com/DS4SD/docling-parse/blob/${src.rev}/CHANGELOG.md";
|
|
description = "Simple package to extract text with coordinates from programmatic PDFs";
|
|
homepage = "https://github.com/DS4SD/docling-parse";
|
|
license = lib.licenses.mit;
|
|
maintainers = with lib.maintainers; [ drupol ];
|
|
};
|
|
}
|