{ lib , stdenv , fetchFromGitHub , buildNpmPackage , nixosTests , gettext , python3 , giflib , darwin , ghostscript_headless , imagemagickBig , jbig2enc , optipng , pngquant , qpdf , tesseract5 , unpaper , poppler_utils , liberation_ttf , xcbuild , pango , pkg-config , nltk-data }: let version = "2.10.1"; src = fetchFromGitHub { owner = "paperless-ngx"; repo = "paperless-ngx"; rev = "refs/tags/v${version}"; hash = "sha256-M1S5ebdpw11Ot4h4xvbk/rbJxXom2dZ5Of+6eOlBIuE="; }; # subpath installation is broken with uvicorn >= 0.26 # https://github.com/NixOS/nixpkgs/issues/298719 # https://github.com/paperless-ngx/paperless-ngx/issues/5494 python = python3.override { packageOverrides = final: prev: { # tesseract5 may be overwritten in the paperless module and we need to propagate that to make the closure reduction effective ocrmypdf = prev.ocrmypdf.override { tesseract = tesseract5; }; uvicorn = prev.uvicorn.overridePythonAttrs (_: { version = "0.25.0"; src = fetchFromGitHub { owner = "encode"; repo = "uvicorn"; rev = "0.25.0"; hash = "sha256-ng98DTw49zyFjrPnEwfnPfONyjKKZYuLl0qduxSppYk="; }; }); djangorestframework = prev.djangorestframework.overridePythonAttrs (oldAttrs: rec { version = "3.14.0"; src = oldAttrs.src.override { rev = version; hash = "sha256-Fnj0n3NS3SetOlwSmGkLE979vNJnYE6i6xwVBslpNz4="; }; nativeCheckInputs = with prev; [ pytest7CheckHook pytest-django ]; }); }; }; path = lib.makeBinPath [ ghostscript_headless imagemagickBig jbig2enc optipng pngquant qpdf tesseract5 unpaper poppler_utils ]; frontend = buildNpmPackage { pname = "paperless-ngx-frontend"; inherit version src; postPatch = '' cd src-ui ''; npmDepsHash = "sha256-zmlYwlH2cnGbbKf6jt5zBLh0Iv3C9/xN0iA4xVetRNE="; nativeBuildInputs = [ pkg-config python3 ] ++ lib.optionals stdenv.isDarwin [ xcbuild ]; buildInputs = [ pango ] ++ lib.optionals stdenv.isDarwin [ giflib darwin.apple_sdk.frameworks.CoreText ]; CYPRESS_INSTALL_BINARY = "0"; NG_CLI_ANALYTICS = "false"; npmBuildFlags = [ "--" "--configuration" "production" ]; doCheck = true; checkPhase = '' runHook preCheck npm run test runHook postCheck ''; installPhase = '' runHook preInstall mkdir -p $out/lib/paperless-ui mv ../src/documents/static/frontend $out/lib/paperless-ui/ runHook postInstall ''; }; in python.pkgs.buildPythonApplication rec { pname = "paperless-ngx"; format = "other"; inherit version src; nativeBuildInputs = [ gettext ]; propagatedBuildInputs = with python.pkgs; [ bleach channels channels-redis concurrent-log-handler dateparser django django-allauth django-auditlog django-celery-results django-compression-middleware django-cors-headers django-extensions django-filter django-guardian django-multiselectfield django-soft-delete djangorestframework djangorestframework-guardian2 drf-writable-nested filelock flower gotenberg-client gunicorn imap-tools inotifyrecursive langdetect mysqlclient nltk ocrmypdf pathvalidate pdf2image psycopg python-dateutil python-dotenv python-gnupg python-ipware python-magic pyzbar rapidfuzz redis scikit-learn setproctitle tika-client tqdm uvicorn watchdog whitenoise whoosh zxing-cpp ] ++ redis.optional-dependencies.hiredis ++ uvicorn.optional-dependencies.standard; postBuild = '' # Compile manually because `pythonRecompileBytecodeHook` only works # for files in `python.sitePackages` ${python.pythonOnBuildForHost.interpreter} -OO -m compileall src # Collect static files ${python.pythonOnBuildForHost.interpreter} src/manage.py collectstatic --clear --no-input # Compile string translations using gettext ${python.pythonOnBuildForHost.interpreter} src/manage.py compilemessages ''; installPhase = let pythonPath = python.pkgs.makePythonPath propagatedBuildInputs; in '' runHook preInstall mkdir -p $out/lib/paperless-ngx cp -r {src,static,LICENSE,gunicorn.conf.py} $out/lib/paperless-ngx ln -s ${frontend}/lib/paperless-ui/frontend $out/lib/paperless-ngx/static/ chmod +x $out/lib/paperless-ngx/src/manage.py makeWrapper $out/lib/paperless-ngx/src/manage.py $out/bin/paperless-ngx \ --prefix PYTHONPATH : "${pythonPath}" \ --prefix PATH : "${path}" makeWrapper ${python.pkgs.celery}/bin/celery $out/bin/celery \ --prefix PYTHONPATH : "${pythonPath}:$out/lib/paperless-ngx/src" \ --prefix PATH : "${path}" runHook postInstall ''; postFixup = '' # Remove tests with samples (~14M) find $out/lib/paperless-ngx -type d -name tests -exec rm -rv {} + ''; nativeCheckInputs = with python.pkgs; [ daphne factory-boy imagehash pytest-django pytest-env pytest-httpx pytest-rerunfailures pytest-xdist pytestCheckHook ]; pytestFlagsArray = [ "src" ]; # The tests require: # - PATH with runtime binaries # - A temporary HOME directory for gnupg # - XDG_DATA_DIRS with test-specific fonts preCheck = '' export PATH="${path}:$PATH" export HOME=$(mktemp -d) export XDG_DATA_DIRS="${liberation_ttf}/share:$XDG_DATA_DIRS" # Disable unneeded code coverage test substituteInPlace src/setup.cfg \ --replace-fail "--cov --cov-report=html --cov-report=xml" "" ''; disabledTests = [ # FileNotFoundError(2, 'No such file or directory'): /build/tmp... "test_script_with_output" "test_script_exit_non_zero" # AssertionError: 10 != 4 (timezone/time issue) # Due to getting local time from modification date in test_consumer.py "testNormalOperation" # Something broken with new Tesseract and inline RTL/LTR overrides? "test_rtl_language_detection" ]; doCheck = !stdenv.isDarwin; passthru = { inherit python path frontend tesseract5; nltkData = with nltk-data; [ punkt snowball_data stopwords ]; tests = { inherit (nixosTests) paperless; }; }; meta = with lib; { description = "Tool to scan, index, and archive all of your physical documents"; homepage = "https://docs.paperless-ngx.com/"; changelog = "https://github.com/paperless-ngx/paperless-ngx/releases/tag/v${version}"; license = licenses.gpl3Only; platforms = platforms.unix; maintainers = with maintainers; [ lukegb gador erikarvstedt leona ]; }; }