depot/third_party/nixpkgs/pkgs/development/python-modules/pandas/default.nix
Default email 7e47f3658e Project import generated by Copybara.
GitOrigin-RevId: 1925c603f17fc89f4c8f6bf6f631a802ad85d784
2024-09-26 11:04:55 +00:00

267 lines
6.2 KiB
Nix

{
lib,
stdenv,
buildPythonPackage,
fetchFromGitHub,
pythonAtLeast,
pythonOlder,
# build-system
cython,
meson-python,
meson,
oldest-supported-numpy,
pkg-config,
versioneer,
wheel,
# propagates
numpy,
python-dateutil,
pytz,
tzdata,
# optionals
beautifulsoup4,
bottleneck,
blosc2,
fsspec,
gcsfs,
html5lib,
jinja2,
lxml,
matplotlib,
numba,
numexpr,
odfpy,
openpyxl,
psycopg2,
pyarrow,
pymysql,
pyqt5,
pyreadstat,
qtpy,
s3fs,
scipy,
sqlalchemy,
tables,
tabulate,
xarray,
xlrd,
xlsxwriter,
zstandard,
# tests
adv_cmds,
glibc,
glibcLocales,
hypothesis,
pytestCheckHook,
pytest-xdist,
pytest-asyncio,
python,
runtimeShell,
}:
let
pandas = buildPythonPackage rec {
pname = "pandas";
version = "2.2.2";
pyproject = true;
disabled = pythonOlder "3.9";
src = fetchFromGitHub {
owner = "pandas-dev";
repo = "pandas";
rev = "refs/tags/v${version}";
hash = "sha256-+zQKrsJmP3FJeOiYwNH1u96+/ECDHQF39evzur3cKjc=";
};
postPatch = ''
substituteInPlace pyproject.toml \
--replace-fail "Cython==3.0.5" "Cython>=3.0.5" \
--replace-fail "meson-python==0.13.1" "meson-python>=0.13.1" \
--replace-fail "meson==1.2.1" "meson>=1.2.1" \
--replace-fail "numpy>=2.0.0rc1" "numpy"
'';
nativeBuildInputs =
[
cython
meson-python
meson
numpy
pkg-config
versioneer
wheel
]
++ versioneer.optional-dependencies.toml
++ lib.optionals (pythonOlder "3.12") [ oldest-supported-numpy ];
enableParallelBuilding = true;
propagatedBuildInputs = [
numpy
python-dateutil
pytz
tzdata
];
passthru.optional-dependencies =
let
extras = {
aws = [ s3fs ];
clipboard = [
pyqt5
qtpy
];
compression = [ zstandard ];
computation = [
scipy
xarray
];
excel = [
odfpy
openpyxl
# TODO: pyxlsb
xlrd
xlsxwriter
];
feather = [ pyarrow ];
fss = [ fsspec ];
gcp = [
gcsfs
# TODO: pandas-gqb
];
hdf5 = [
blosc2
tables
];
html = [
beautifulsoup4
html5lib
lxml
];
mysql = [
sqlalchemy
pymysql
];
output_formatting = [
jinja2
tabulate
];
parquet = [ pyarrow ];
performance = [
bottleneck
numba
numexpr
];
plot = [ matplotlib ];
postgresql = [
sqlalchemy
psycopg2
];
spss = [ pyreadstat ];
sql-other = [ sqlalchemy ];
xml = [ lxml ];
};
in
extras // { all = lib.concatLists (lib.attrValues extras); };
doCheck = false; # various infinite recursions
passthru.tests.pytest = pandas.overridePythonAttrs (_: {
doCheck = true;
});
nativeCheckInputs =
[
glibcLocales
hypothesis
pytest-asyncio
pytest-xdist
pytestCheckHook
]
++ lib.flatten (lib.attrValues passthru.optional-dependencies)
++ lib.optionals (stdenv.hostPlatform.isLinux) [
# for locale executable
glibc
]
++ lib.optionals (stdenv.hostPlatform.isDarwin) [
# for locale executable
adv_cmds
];
# don't max out build cores, it breaks tests
dontUsePytestXdist = true;
__darwinAllowLocalNetworking = true;
pytestFlagsArray = [
# https://github.com/pandas-dev/pandas/blob/main/test_fast.sh
"-m"
"'not single_cpu and not slow and not network and not db and not slow_arm'"
# https://github.com/pandas-dev/pandas/issues/54907
"--no-strict-data-files"
"--numprocesses"
"4"
];
disabledTests =
[
# AssertionError: Did not see expected warning of class 'FutureWarning'
"test_parsing_tzlocal_deprecated"
]
++ lib.optionals (stdenv.hostPlatform.isDarwin && stdenv.hostPlatform.isAarch64) [
# tests/generic/test_finalize.py::test_binops[and_-args4-right] - AssertionError: assert {} == {'a': 1}
"test_binops"
# These tests are unreliable on aarch64-darwin. See https://github.com/pandas-dev/pandas/issues/38921.
"test_rolling"
]
++ lib.optional stdenv.hostPlatform.is32bit [
# https://github.com/pandas-dev/pandas/issues/37398
"test_rolling_var_numerical_issues"
];
# Tests have relative paths, and need to reference compiled C extensions
# so change directory where `import .test` is able to be resolved
preCheck =
''
export HOME=$TMPDIR
export LC_ALL="en_US.UTF-8"
cd $out/${python.sitePackages}/pandas
''
# TODO: Get locale and clipboard support working on darwin.
# Until then we disable the tests.
+ lib.optionalString stdenv.hostPlatform.isDarwin ''
# Fake the impure dependencies pbpaste and pbcopy
echo "#!${runtimeShell}" > pbcopy
echo "#!${runtimeShell}" > pbpaste
chmod a+x pbcopy pbpaste
export PATH=$(pwd):$PATH
'';
pythonImportsCheck = [ "pandas" ];
meta = with lib; {
# pandas devs no longer test i686, it's commonly broken
# broken = stdenv.hostPlatform.isi686;
changelog = "https://pandas.pydata.org/docs/whatsnew/index.html";
description = "Powerful data structures for data analysis, time series, and statistics";
downloadPage = "https://github.com/pandas-dev/pandas";
homepage = "https://pandas.pydata.org";
license = licenses.bsd3;
longDescription = ''
Flexible and powerful data analysis / manipulation library for
Python, providing labeled data structures similar to R data.frame
objects, statistical functions, and much more.
'';
maintainers = with maintainers; [
raskin
knedlsepp
];
};
};
in
pandas