2024-09-19 14:19:46 +00:00
|
|
|
{
|
|
|
|
lib,
|
|
|
|
python3Packages,
|
|
|
|
fetchzip,
|
|
|
|
writeScript,
|
|
|
|
}:
|
2020-04-24 23:36:52 +00:00
|
|
|
|
2024-09-19 14:19:46 +00:00
|
|
|
python3Packages.buildPythonApplication rec {
|
2020-04-24 23:36:52 +00:00
|
|
|
pname = "pdf-parser";
|
2024-09-19 14:19:46 +00:00
|
|
|
version = "0.7.9";
|
|
|
|
pyproject = false;
|
2020-04-24 23:36:52 +00:00
|
|
|
|
|
|
|
src = fetchzip {
|
2024-09-19 14:19:46 +00:00
|
|
|
url = "https://didierstevens.com/files/software/pdf-parser_V${
|
|
|
|
lib.replaceStrings [ "." ] [ "_" ] version
|
|
|
|
}.zip";
|
|
|
|
hash = "sha256-1mFThtTe1LKkM/MML44RgskGv3FZborNVBsTqSKanks=";
|
2020-04-24 23:36:52 +00:00
|
|
|
};
|
|
|
|
|
2024-09-19 14:19:46 +00:00
|
|
|
postPatch = ''
|
|
|
|
# quote regular expressions correctly
|
|
|
|
substituteInPlace pdf-parser.py \
|
|
|
|
--replace-fail \
|
|
|
|
"re.sub('" \
|
|
|
|
"re.sub(r'" \
|
|
|
|
--replace-fail \
|
|
|
|
"re.match('" \
|
|
|
|
"re.match(r'"
|
|
|
|
'';
|
2020-04-24 23:36:52 +00:00
|
|
|
|
|
|
|
installPhase = ''
|
|
|
|
install -Dm555 pdf-parser.py $out/bin/pdf-parser.py
|
|
|
|
'';
|
|
|
|
|
|
|
|
preFixup = ''
|
|
|
|
substituteInPlace $out/bin/pdf-parser.py \
|
2024-09-19 14:19:46 +00:00
|
|
|
--replace-fail '/usr/bin/python' '${python3Packages.python}/bin/python'
|
|
|
|
'';
|
|
|
|
|
|
|
|
passthru.updateScript = writeScript "update-pdf-parser" ''
|
|
|
|
#!/usr/bin/env nix-shell
|
|
|
|
#!nix-shell -i bash -p common-updater-scripts curl pcre2
|
|
|
|
|
|
|
|
set -eu -o pipefail
|
|
|
|
|
|
|
|
version="$(curl -s https://blog.didierstevens.com/programs/pdf-tools/ |
|
|
|
|
pcre2grep -O '$1.$2.$3' '\bpdf-parser_V(\d+)_(\d+)_(\d+)\.zip\b.*')"
|
|
|
|
|
|
|
|
update-source-version "$UPDATE_NIX_ATTR_PATH" "$version"
|
2020-04-24 23:36:52 +00:00
|
|
|
'';
|
|
|
|
|
2024-09-19 14:19:46 +00:00
|
|
|
meta = {
|
2020-04-24 23:36:52 +00:00
|
|
|
description = "Parse a PDF document";
|
|
|
|
longDescription = ''
|
|
|
|
This tool will parse a PDF document to identify the fundamental elements used in the analyzed file.
|
|
|
|
It will not render a PDF document.
|
|
|
|
'';
|
|
|
|
homepage = "https://blog.didierstevens.com/programs/pdf-tools/";
|
2024-09-19 14:19:46 +00:00
|
|
|
license = lib.licenses.publicDomain;
|
|
|
|
maintainers = [ lib.maintainers.lightdiscord ];
|
|
|
|
platforms = lib.platforms.all;
|
2024-01-02 11:29:13 +00:00
|
|
|
mainProgram = "pdf-parser.py";
|
2020-04-24 23:36:52 +00:00
|
|
|
};
|
|
|
|
}
|