python-dask/python-dask.spec

260 lines
9.7 KiB
RPMSpec
Raw Permalink Normal View History

2019-03-07 00:58:51 +00:00
%global srcname dask
# Requires distributed, which is a loop.
2019-09-14 07:48:43 +00:00
# Also, some tests require packages that require dask itself.
2019-03-07 00:58:51 +00:00
# Force bootstrap for package review.
2019-07-23 05:48:25 +00:00
%bcond_without bootstrap
2019-03-07 00:58:51 +00:00
# We have an arched package to detect arch-dependent issues in dependencies,
# but all of the installable RPMs are noarch and there is no compiled code.
%global debug_package %{nil}
2019-03-07 00:58:51 +00:00
Name: python-%{srcname}
2023-05-08 03:22:38 +00:00
Version: 2023.4.1
%global tag 2023.4.1
Release: %autorelease -e 0.riscv64
2019-03-07 00:58:51 +00:00
Summary: Parallel PyData with Task Scheduling
2023-01-22 05:57:56 +00:00
License: BSD-3-Clause
2022-07-25 21:36:28 +00:00
URL: https://github.com/dask/dask
Source0: %{pypi_source %{srcname}}
# https://github.com/dask/dask/issues/6725
Patch: 0001-Skip-test_encoding_gh601-on-big-endian-machines.patch
2023-05-08 03:22:38 +00:00
# Fedora-specific patch.
Patch: 0002-Skip-coverage-testing.patch
2019-03-07 00:58:51 +00:00
%description
Dask is a flexible parallel computing library for analytics.
%package -n python3-%{srcname}
Summary: %{summary}
BuildArch: noarch
2019-03-07 00:58:51 +00:00
BuildRequires: python3-devel
BuildRequires: python3dist(graphviz)
BuildRequires: python3dist(ipython)
2019-07-23 06:43:50 +00:00
%if %{without bootstrap}
2019-09-14 07:48:43 +00:00
BuildRequires: python3dist(scikit-image)
BuildRequires: python3dist(xarray)
2019-03-07 00:58:51 +00:00
%endif
2019-09-14 07:48:43 +00:00
# Optional test requirements.
# Fastavro does not support 32 bit architectures and is ExcludeArch:
# https://bugzilla.redhat.com/show_bug.cgi?id=1943932
%ifnarch %{arm32} %{ix86}
2019-09-14 07:48:43 +00:00
BuildRequires: python3dist(fastavro)
%endif
2019-09-14 07:48:43 +00:00
BuildRequires: python3dist(h5py)
BuildRequires: python3dist(psutil)
# libarrow does not support 32 bit architectures and is ExcludeArch.
# Tests don't pass on s390x either.
%ifnarch %{arm} %{ix86} s390x
BuildRequires: python3dist(pyarrow)
%endif
2019-09-14 07:48:43 +00:00
BuildRequires: python3dist(requests)
BuildRequires: python3dist(sqlalchemy)
BuildRequires: python3dist(tables)
2019-09-14 07:48:43 +00:00
BuildRequires: python3dist(zarr)
2019-03-07 00:58:51 +00:00
Recommends: python3-%{srcname}+array = %{version}-%{release}
Recommends: python3-%{srcname}+bag = %{version}-%{release}
Recommends: python3-%{srcname}+dataframe = %{version}-%{release}
Recommends: python3-%{srcname}+delayed = %{version}-%{release}
2019-11-13 03:04:07 +00:00
%if %{without bootstrap}
Recommends: python3-%{srcname}+distributed = %{version}-%{release}
2019-11-13 03:04:07 +00:00
%endif
# No recent enough Bokeh is packaged
Obsoletes: python3-%{srcname}+diagnostics < 2022.5.0-1
# There is nothing that can be unbundled; there are some some snippets forked
2023-01-22 05:57:56 +00:00
# or copied from unspecified versions of numpy, under a BSD-3-Clause license
# similar to that of dask itself.
#
# - dask/array/numpy_compat.py:
# _Recurser, moveaxis, rollaxis, sliding_window_view
# - dask/array/backends.py:
# _tensordot
# - dask/array/core.py:
# block
# - dask/array/einsumfuncs.py:
# parse_einsum_input
# - dask/array/routines.py:
# cov, _average
Provides: bundled(numpy)
%description -n python3-%{srcname}
Dask is a flexible parallel computing library for analytics.
%pyproject_extras_subpkg -n python3-%{srcname} array bag dataframe delayed
2019-11-13 03:04:07 +00:00
%if %{without bootstrap}
2021-08-21 20:10:35 +00:00
%pyproject_extras_subpkg distributed
2019-11-13 03:04:07 +00:00
%endif
2019-03-07 00:58:51 +00:00
2019-07-23 06:43:50 +00:00
%if %{without bootstrap}
2019-03-07 00:58:51 +00:00
%package -n python-%{srcname}-doc
Summary: dask documentation
BuildArch: noarch
2021-01-19 07:33:52 +00:00
BuildRequires: python3dist(dask_sphinx_theme) >= 1.3.5
2019-03-07 00:58:51 +00:00
BuildRequires: python3dist(numpydoc)
2021-08-21 20:10:35 +00:00
BuildRequires: python3dist(sphinx) >= 4
2019-03-07 00:58:51 +00:00
%description -n python-%{srcname}-doc
2021-06-17 10:24:36 +00:00
Documentation for dask.
2019-03-07 00:58:51 +00:00
%endif
%prep
%autosetup -n %{srcname}-%{version} -p1
2022-06-21 10:03:36 +00:00
# we don't use pre-commit when running tests
sed -i '/"pre-commit"/d' setup.py
2019-03-07 00:58:51 +00:00
2021-08-21 20:10:35 +00:00
%generate_buildrequires
%pyproject_buildrequires -r -x test,array,bag,dataframe,delayed
2021-08-21 20:10:35 +00:00
%if %{without bootstrap}
%pyproject_buildrequires -x distributed
%endif
2019-03-07 00:58:51 +00:00
%build
2021-08-21 20:10:35 +00:00
%pyproject_wheel
2019-03-07 00:58:51 +00:00
2019-07-23 06:43:50 +00:00
%if %{without bootstrap}
2019-03-07 00:58:51 +00:00
# generate html docs
PYTHONPATH=${PWD} sphinx-build-3 docs/source html
# remove the sphinx-build leftovers
rm -rf html/.{doctrees,buildinfo}
%endif
%install
2021-08-21 20:10:35 +00:00
%pyproject_install
%pyproject_save_files %{srcname}
2019-03-07 00:58:51 +00:00
%check
2021-06-17 10:24:36 +00:00
%ifarch arm
# Is there a way to do this in one line?
%global have_arm 1
2019-09-14 07:48:43 +00:00
%endif
2019-03-07 00:58:51 +00:00
%if 0%{?__isa_bits} == 32
# read_sql_query with meta converts dtypes from 32 to 64.
# https://github.com/dask/dask/issues/8620
# > tm.assert_frame_equal(
# a, b, check_names=check_names, check_dtype=check_dtype, **kwargs
# E AssertionError: Attributes of DataFrame.iloc[:, 1] (column name="age") are different
# E
# E Attribute "dtype" are different
# E [left]: int32
# E [right]: int64
# dask/dataframe/utils.py:555: AssertionError
k="${k-}${k+ and }not test_query_with_meta"
%endif
%ifarch ppc64le
# TODO: Should this be reported upstream? Is it a dask issue, or a numpy one?
# Possibly related to
# https://fedoraproject.org/wiki/Changes/PPC64LE_Float128_Transition?
# > assert allclose(a, b, equal_nan=equal_nan, **kwargs), msg
# E AssertionError: found values in 'a' and 'b' which differ by more than the allowed amount
# E assert False
# E + where False = allclose(array([0.12586355-0.09957204j, 0.20256483+0.04098342j,\n 0.05781123-0.03588671j, 0.01135963-0.03334219j,\n 0.03747771+0.07495994j, 0.2106574 -0.0363521j ,\n 0.16352091+0.03782915j, 0.1381678 -0.06815128j,\n 0.03781295-0.04011523j, 0.01493269+0.07780643j]), array([0.12559072-0.07164038j, 0.20256483+0.05438578j,\n 0.05781123-0.03588671j, 0.01135963-0.03334219j,\n 0.03747771+0.07495994j, 0.2106574 -0.0363521j ,\n 0.16352091+0.03782915j, 0.1381678 -0.06815128j,\n 0.03781295-0.04011523j, 0.01493269+0.07780643j]), equal_nan=True, **{})
# dask/array/utils.py:361: AssertionError
k="${k-}${k+ and }not test_lstsq[100-10-10-True]"
# > assert allclose(a, b, equal_nan=equal_nan, **kwargs), msg
# E AssertionError: found values in 'a' and 'b' which differ by more than the allowed amount
# E assert False
# E + where False = allclose(array([ 0.20168675+0.08857556j, 0.144233 -0.19173091j,\n -0.03367557-0.08053959j, 0.04108325-0.24648308j,\n -0.01844576+0.00841932j, 0.29652375+0.05682199j,\n 0.05551828+0.20156798j, -0.08409592+0.02354949j,\n 0.09848743-0.00748637j, 0.22889193-0.07372773j]), array([ 0.20067551+0.2642591j , 0.144233 -0.18573336j,\n -0.03367557-0.08053959j, 0.04108325-0.24648308j,\n -0.01844576+0.00841932j, 0.29652375+0.05682199j,\n 0.05551828+0.20156798j, -0.08409592+0.02354949j,\n 0.09848743-0.00748637j, 0.22889193-0.07372773j]), equal_nan=True, **{})
# dask/array/utils.py:361: AssertionError
k="${k-}${k+ and }not test_lstsq[20-10-5-True]"
# test_vdot fails with NumPy 1.19.0
# https://github.com/dask/dask/issues/6406
#
# vdot returns incorrect results on ppc64le
# https://github.com/numpy/numpy/issues/17087
# > assert allclose(a, b, equal_nan=equal_nan, **kwargs), msg
# E AssertionError: found values in 'a' and 'b' which differ by more than the allowed amount
# E assert False
# E + where False = allclose((0.38772781971416226-0.6851997484294434j), (0.38772781971416226-0.306563166009585j), equal_nan=True, **{})
# dask/array/utils.py:361: AssertionError
k="${k-}${k+ and }not test_vdot[shape0-chunks0]"
# > assert allclose(a, b, equal_nan=equal_nan, **kwargs), msg
# E AssertionError: found values in 'a' and 'b' which differ by more than the allowed amount
# E assert False
# E + where False = allclose((0.38772781971416226-0.6851997484294434j), (0.38772781971416226-0.306563166009585j), equal_nan=True, **{})
# dask/array/utils.py:361: AssertionError
k="${k-}${k+ and }not test_vdot[shape1-chunks1]"
%endif
# This test compares against files in .github/. It does not work on the PyPI
# sdist, and is only relevant to upstream CI anyway.
#
# test_development_guidelines_matches_ci fails from sdist
# https://github.com/dask/dask/issues/8499
k="${k-}${k+ and }not test_development_guidelines_matches_ci"
%ifarch riscv64
# RISCV failing tests
k="${k-}${k+ and }not test_datetime_std_with_larger_dataset[None-True-1]"
k="${k-}${k+ and }not test_dir_filter[pyarrow]"
k="${k-}${k+ and }not test_append_with_partition[pyarrow]"
k="${k-}${k+ and }not test_series_aggregations_multilevel[prod-disk-1-<lambda>2]"
k="${k-}${k+ and }not test_series_aggregations_multilevel[prod-disk-2-<lambda>2]"
k="${k-}${k+ and }not test_series_aggregations_multilevel[prod-tasks-1-<lambda>2]"
k="${k-}${k+ and }not test_series_aggregations_multilevel[prod-tasks-2-<lambda>2]"
k="${k-}${k+ and }not test_groupby_reduction_split[prod-disk-split_every]"
k="${k-}${k+ and }not test_groupby_reduction_split[prod-disk-split_out]"
k="${k-}${k+ and }not test_groupby_reduction_split[prod-tasks-split_every]"
k="${k-}${k+ and }not test_groupby_reduction_split[prod-tasks-split_out]"
k="${k-}${k+ and }not test_concat_dataframe_empty"
k="${k-}${k+ and }not test_dataframe_aggregations_multilevel[prod-disk-1-<lambda>4]"
k="${k-}${k+ and }not test_dataframe_aggregations_multilevel[prod-disk-2-<lambda>4]"
k="${k-}${k+ and }not test_dataframe_aggregations_multilevel[prod-tasks-1-<lambda>4]"
k="${k-}${k+ and }not test_dataframe_aggregations_multilevel[prod-tasks-2-<lambda>4]"
k="${k-}${k+ and }not test_categorical_merge_with_merge_column_cat_in_one_and_not_other_upcasts"
%endif
2021-06-17 10:24:36 +00:00
pytest_args=(
-m 'not network'
-n %[0%{?have_arm}?"2":"auto"]
2022-01-16 00:20:12 +00:00
2023-03-28 08:37:06 +00:00
%ifarch %{ix86}
# Ignore 32-bit warning
-W 'ignore:invalid value encountered in cast:RuntimeWarning'
%endif
-k "${k-}"
2023-01-22 05:57:56 +00:00
--pyargs dask
2021-06-17 10:24:36 +00:00
)
2023-01-22 05:57:56 +00:00
cd docs
2021-06-17 10:24:36 +00:00
%{pytest} "${pytest_args[@]}"
2019-03-07 00:58:51 +00:00
2021-08-21 20:10:35 +00:00
%files -n python3-%{srcname} -f %{pyproject_files}
2019-03-07 00:58:51 +00:00
%doc README.rst
%license LICENSE.txt dask/array/NUMPY_LICENSE.txt
2022-10-16 23:30:04 +00:00
%{_bindir}/dask
2019-07-23 06:43:50 +00:00
%if %{without bootstrap}
2019-03-07 00:58:51 +00:00
%files -n python-%{srcname}-doc
%doc html
%license LICENSE.txt dask/array/NUMPY_LICENSE.txt
2019-03-07 00:58:51 +00:00
%endif
%changelog
2021-07-31 07:34:37 +00:00
%autochangelog