summary refs log tree commit diff
path: root/gnu/packages
diff options
context:
space:
mode:
author Ricardo Wurmus <rekado@elephly.net> 2021-07-28 20:29:21 +0200
committer Ricardo Wurmus <rekado@elephly.net> 2021-07-28 20:31:06 +0200
commit 042b6971d73b6bef8b9e81ac5b9e136ea997edfd (patch)
tree ef02c0ebacb0d318e34d36232f6974898559ba97 /gnu/packages
parent 251bfbcfaae7c5363c752549d167c82fecfd49a7 (diff)
download guix-042b6971d73b6bef8b9e81ac5b9e136ea997edfd.tar.gz
gnu: Add python-modin.
* gnu/packages/python-science.scm (python-modin): New variable.
Diffstat (limited to 'gnu/packages')
-rw-r--r-- gnu/packages/python-science.scm 65
1 files changed, 65 insertions, 0 deletions
diff --git a/gnu/packages/python-science.scm b/gnu/packages/python-science.scm
index 3aa3edce17..738b504e3b 100644
--- a/gnu/packages/python-science.scm
+++ b/gnu/packages/python-science.scm
@@ -916,3 +916,68 @@ computing in Python.  It extends both the @code{concurrent.futures} and
 @code{dask} APIs to moderate sized clusters.")
     (license license:bsd-3)))
 
+(define-public python-modin
+  (package
+    (name "python-modin")
+    (version "0.10.1")
+    (source
+     (origin
+       ;; The PyPI archive omits some required files, so fetch from Git instead.
+       (method git-fetch)
+       (uri (git-reference
+             (url "https://github.com/modin-project/modin")
+             (commit version)))         ; check out the ref named by VERSION
+       (file-name (git-file-name name version))
+       (sha256
+        (base32
+         "128ghfb9ncmnn8km409xjcdppvn9nr9jqw8rkvsfavh7wnwlk509"))))
+    (build-system python-build-system)
+    (arguments
+     `(#:phases
+       (modify-phases %standard-phases
+         (add-after 'unpack 'make-files-writable
+           (lambda _                    ; NOTE(review): motive not stated; confirm
+             (for-each make-file-writable (find-files "."))))
+         (replace 'check                ; overrides the standard check phase
+           (lambda* (#:key tests? #:allow-other-keys)
+             (when tests?               ; nothing is run when #:tests? is #f
+               (setenv "MODIN_ENGINE" "dask") ; first run: "dask" engine
+               (invoke "python" "-m" "pytest"
+                       "modin/pandas/test/test_concat.py") ; only this file is run
+               (setenv "MODIN_ENGINE" "python") ; second run: "python" engine
+               (invoke "python" "-m" "pytest"
+                       "modin/pandas/test/test_concat.py")))))))
+    (propagated-inputs                  ; installed alongside this package
+     `(("python-cloudpickle" ,python-cloudpickle)
+       ("python-dask" ,python-dask)
+       ("python-distributed" ,python-distributed)
+       ("python-numpy" ,python-numpy)
+       ("python-packaging" ,python-packaging)
+       ("python-pandas" ,python-pandas)))
+    (native-inputs                      ; build-time only; pytest is used by 'check
+     `(("python-coverage" ,python-coverage)
+       ("python-jinja2" ,python-jinja2)
+       ("python-lxml" ,python-lxml)
+       ("python-matplotlib" ,python-matplotlib)
+       ("python-msgpack" ,python-msgpack)
+       ("python-openpyxl" ,python-openpyxl)
+       ("python-psutil" ,python-psutil)
+       ("python-pyarrow" ,python-pyarrow)
+       ("python-pytest" ,python-pytest)
+       ("python-pytest-benchmark" ,python-pytest-benchmark)
+       ("python-pytest-cov" ,python-pytest-cov)
+       ("python-pytest-xdist" ,python-pytest-xdist)
+       ("python-scipy" ,python-scipy)
+       ("python-sqlalchemy" ,python-sqlalchemy)
+       ("python-tables" ,python-tables)
+       ("python-tqdm" ,python-tqdm)
+       ("python-xarray" ,python-xarray)
+       ("python-xlrd" ,python-xlrd)))
+    (home-page "https://github.com/modin-project/modin")
+    (synopsis "Make your pandas code run faster")
+    (description
+     "Modin uses Ray or Dask to provide an effortless way to speed up your
+pandas notebooks, scripts, and libraries.  Unlike other distributed DataFrame
+libraries, Modin provides seamless integration and compatibility with existing
+pandas code.")
+    (license license:asl2.0)))