2024-06-05 15:53:02 +00:00
|
|
|
{
  # Core helpers. `pythonAtLeast` is not referenced by this expression at the
  # moment; it stays in the argument set so the call interface is unchanged.
  lib,
  stdenv,
  buildPythonPackage,
  fetchFromGitHub,
  pythonAtLeast,
  pythonOlder,

  # build-system: inputs consumed by nativeBuildInputs
  cython,
  meson-python,
  meson,
  oldest-supported-numpy,
  pkg-config,
  versioneer,
  wheel,

  # propagates: inputs listed in propagatedBuildInputs
  numpy,
  python-dateutil,
  pytz,
  tzdata,

  # optionals: packages backing passthru.optional-dependencies
  beautifulsoup4,
  bottleneck,
  blosc2,
  fsspec,
  gcsfs,
  html5lib,
  jinja2,
  lxml,
  matplotlib,
  numba,
  numexpr,
  odfpy,
  openpyxl,
  psycopg2,
  pyarrow,
  pymysql,
  pyqt5,
  pyreadstat,
  qtpy,
  s3fs,
  scipy,
  sqlalchemy,
  tables,
  tabulate,
  xarray,
  xlrd,
  xlsxwriter,
  zstandard,

  # tests: inputs used by nativeCheckInputs and preCheck
  adv_cmds,
  glibc,
  glibcLocales,
  hypothesis,
  pytestCheckHook,
  pytest-xdist,
  pytest-asyncio,
  python,
  runtimeShell,
}:
|
|
|
|
|
2024-06-05 15:53:02 +00:00
|
|
|
let
  # The package is bound to a name so that `passthru.tests.pytest` below can
  # refer back to it and switch the test suite on via `overridePythonAttrs`.
  pandas = buildPythonPackage rec {
    pname = "pandas";
    version = "2.2.1";
    pyproject = true;

    disabled = pythonOlder "3.9";

    src = fetchFromGitHub {
      owner = "pandas-dev";
      repo = "pandas";
      rev = "refs/tags/v${version}";
      hash = "sha256-eyVUIYG0KCAEJbh/qZiEjGpdXq7A+2Lab+5bp+7t4cw=";
    };

    # Turn the exact build-requirement pins in pyproject.toml into lower
    # bounds. NOTE(review): `--replace-fail` is expected to abort when a
    # pattern no longer matches, so re-check these pins on every version bump.
    postPatch = ''
      substituteInPlace pyproject.toml \
        --replace-fail "Cython==3.0.5" "Cython>=3.0.5" \
        --replace-fail "meson-python==0.13.1" "meson-python>=0.13.1" \
        --replace-fail "meson==1.2.1" "meson>=1.2.1"
    '';

    nativeBuildInputs =
      [
        cython
        meson-python
        meson
        numpy
        pkg-config
        versioneer
        wheel
      ]
      ++ versioneer.optional-dependencies.toml
      # oldest-supported-numpy is only added for interpreters older than 3.12.
      ++ lib.optionals (pythonOlder "3.12") [ oldest-supported-numpy ];

    enableParallelBuilding = true;

    propagatedBuildInputs = [
      numpy
      python-dateutil
      pytz
      tzdata
    ];

    # One attribute per extra, plus a synthetic `all` that concatenates every
    # extra's package list.
    passthru.optional-dependencies =
      let
        extras = {
          aws = [ s3fs ];
          clipboard = [
            pyqt5
            qtpy
          ];
          compression = [ zstandard ];
          computation = [
            scipy
            xarray
          ];
          excel = [
            odfpy
            openpyxl
            # TODO: pyxlsb
            xlrd
            xlsxwriter
          ];
          feather = [ pyarrow ];
          fss = [ fsspec ];
          gcp = [
            gcsfs
            # TODO: pandas-gbq
          ];
          hdf5 = [
            blosc2
            tables
          ];
          html = [
            beautifulsoup4
            html5lib
            lxml
          ];
          mysql = [
            sqlalchemy
            pymysql
          ];
          output_formatting = [
            jinja2
            tabulate
          ];
          parquet = [ pyarrow ];
          performance = [
            bottleneck
            numba
            numexpr
          ];
          plot = [ matplotlib ];
          postgresql = [
            sqlalchemy
            psycopg2
          ];
          spss = [ pyreadstat ];
          sql-other = [ sqlalchemy ];
          xml = [ lxml ];
        };
      in
      extras // { all = lib.concatLists (lib.attrValues extras); };

    # Tests are off for the package itself and exposed as a separate
    # derivation through passthru.tests.pytest instead.
    doCheck = false; # various infinite recursions

    passthru.tests.pytest = pandas.overridePythonAttrs (_: {
      doCheck = true;
    });

    # Test inputs: the fixed test tooling, every optional dependency, and a
    # platform-specific provider of the `locale` executable.
    nativeCheckInputs =
      [
        glibcLocales
        hypothesis
        pytest-asyncio
        pytest-xdist
        pytestCheckHook
      ]
      ++ lib.flatten (lib.attrValues passthru.optional-dependencies)
      ++ lib.optionals stdenv.isLinux [
        # for locale executable
        glibc
      ]
      ++ lib.optionals stdenv.isDarwin [
        # for locale executable
        adv_cmds
      ];

    # don't max out build cores, it breaks tests
    # (the worker count is pinned via `--numprocesses` in pytestFlagsArray)
    dontUsePytestXdist = true;

    __darwinAllowLocalNetworking = true;

    pytestFlagsArray = [
      # https://github.com/pandas-dev/pandas/blob/main/test_fast.sh
      "-m"
      "'not single_cpu and not slow and not network and not db and not slow_arm'"
      # https://github.com/pandas-dev/pandas/issues/54907
      "--no-strict-data-files"
      "--numprocesses"
      "4"
    ];

    disabledTests =
      [
        # AssertionError: Did not see expected warning of class 'FutureWarning'
        "test_parsing_tzlocal_deprecated"
      ]
      ++ lib.optionals (stdenv.isDarwin && stdenv.isAarch64) [
        # tests/generic/test_finalize.py::test_binops[and_-args4-right] - AssertionError: assert {} == {'a': 1}
        "test_binops"
        # These tests are unreliable on aarch64-darwin. See https://github.com/pandas-dev/pandas/issues/38921.
        "test_rolling"
      ]
      # `lib.optionals` (plural) is required here: the argument is already a
      # list, and `lib.optional` would wrap it again and append a nested list.
      ++ lib.optionals stdenv.is32bit [
        # https://github.com/pandas-dev/pandas/issues/37398
        "test_rolling_var_numerical_issues"
      ];

    # Tests have relative paths, and need to reference compiled C extensions
    # so change directory where `import .test` is able to be resolved
    preCheck =
      ''
        export HOME=$TMPDIR
        export LC_ALL="en_US.UTF-8"
        cd $out/${python.sitePackages}/pandas
      ''
      # TODO: Get locale and clipboard support working on darwin.
      #       Until then the clipboard tools are replaced by empty stub scripts.
      + lib.optionalString stdenv.isDarwin ''
        # Fake the impure dependencies pbpaste and pbcopy
        echo "#!${runtimeShell}" > pbcopy
        echo "#!${runtimeShell}" > pbpaste
        chmod a+x pbcopy pbpaste
        export PATH=$(pwd):$PATH
      '';

    pythonImportsCheck = [ "pandas" ];

    meta = {
      # pandas devs no longer test i686, it's commonly broken
      # broken = stdenv.isi686;
      changelog = "https://pandas.pydata.org/docs/whatsnew/index.html";
      description = "Powerful data structures for data analysis, time series, and statistics";
      downloadPage = "https://github.com/pandas-dev/pandas";
      homepage = "https://pandas.pydata.org";
      license = lib.licenses.bsd3;
      longDescription = ''
        Flexible and powerful data analysis / manipulation library for
        Python, providing labeled data structures similar to R data.frame
        objects, statistical functions, and much more.
      '';
      maintainers = with lib.maintainers; [
        raskin
        knedlsepp
      ];
    };
  };
in
pandas
|