gnu: Add python-vega-datasets.

* gnu/packages/statistics.scm (python-vega-datasets): New variable.
* gnu/packages/patches/python-vega-datasets-remove-la-riots-code.patch: New
file.
* gnu/local.mk (dist_patch_DATA): Register it.
This commit is contained in:
Vinicius Monego 2023-05-20 15:03:32 -03:00
parent c210dbe43e
commit 64e5e17d8c
No known key found for this signature in database
GPG key ID: 637B0B138065B68A
3 changed files with 119 additions and 0 deletions

View file

@ -1834,6 +1834,7 @@ dist_patch_DATA = \
%D%/packages/patches/python-typing-inspect-fix.patch \ %D%/packages/patches/python-typing-inspect-fix.patch \
%D%/packages/patches/python-unittest2-python3-compat.patch \ %D%/packages/patches/python-unittest2-python3-compat.patch \
%D%/packages/patches/python-unittest2-remove-argparse.patch \ %D%/packages/patches/python-unittest2-remove-argparse.patch \
%D%/packages/patches/python-vega-datasets-remove-la-riots-code.patch \
%D%/packages/patches/python-versioneer-guix-support.patch \ %D%/packages/patches/python-versioneer-guix-support.patch \
%D%/packages/patches/python-waitress-fix-tests.patch \ %D%/packages/patches/python-waitress-fix-tests.patch \
%D%/packages/patches/python-werkzeug-tests.patch \ %D%/packages/patches/python-werkzeug-tests.patch \

View file

@ -0,0 +1,89 @@
# This patch was imported from Debian:
# https://sources.debian.org/src/python-vega-datasets/0.9%2Bdfsg-1/debian/patches/remove-la-riots-related-code.patch/
# According to the Debian package, the license of this dataset is unclear, and the dataset is not available from the Los Angeles Times for European users.
Index: vega_datasets/vega_datasets/tests/test_local_datasets.py
===================================================================
--- vega_datasets.orig/vega_datasets/tests/test_local_datasets.py
+++ vega_datasets/vega_datasets/tests/test_local_datasets.py
@@ -75,7 +75,6 @@ def test_cars_column_names():
[
("cars", "Year"),
("stocks", "date"),
- ("la-riots", "death_date"),
("iowa-electricity", "year"),
("seattle-weather", "date"),
("seattle-temps", "date"),
Index: vega_datasets/vega_datasets/core.py
===================================================================
--- vega_datasets.orig/vega_datasets/core.py
+++ vega_datasets/vega_datasets/core.py
@@ -322,11 +322,6 @@ class IowaElectricity(Dataset):
_pd_read_kwds = {"parse_dates": ["year"]}
-class LARiots(Dataset):
- name = "la-riots"
- _pd_read_kwds = {"parse_dates": ["death_date"]}
-
-
class Miserables(Dataset):
name = "miserables"
_return_type = tuple
Index: vega_datasets/vega_datasets/datasets.json
===================================================================
--- vega_datasets.orig/vega_datasets/datasets.json
+++ vega_datasets/vega_datasets/datasets.json
@@ -143,10 +143,6 @@
"filename": "jobs.json",
"format": "json"
},
- "la-riots": {
- "filename": "la-riots.csv",
- "format": "csv"
- },
"londonBoroughs": {
"filename": "londonBoroughs.json",
"format": "json"
@@ -279,4 +275,4 @@
"filename": "zipcodes.csv",
"format": "csv"
}
-}
\ No newline at end of file
+}
Index: vega_datasets/vega_datasets/local_datasets.json
===================================================================
--- vega_datasets.orig/vega_datasets/local_datasets.json
+++ vega_datasets/vega_datasets/local_datasets.json
@@ -8,7 +8,6 @@
"driving": "_data/driving.json",
"iowa-electricity": "_data/iowa-electricity.csv",
"iris": "_data/iris.json",
- "la-riots": "_data/la-riots.csv",
"ohlc": "_data/ohlc.json",
"seattle-temps": "_data/seattle-temps.csv",
"seattle-weather": "_data/seattle-weather.csv",
@@ -16,4 +15,4 @@
"stocks": "_data/stocks.csv",
"us-employment": "_data/us-employment.csv",
"wheat": "_data/wheat.json"
-}
\ No newline at end of file
+}
Index: vega_datasets/vega_datasets/dataset_info.json
===================================================================
--- vega_datasets.orig/vega_datasets/dataset_info.json
+++ vega_datasets/vega_datasets/dataset_info.json
@@ -49,12 +49,6 @@
"R. A. Fisher (1936). 'The use of multiple measurements in taxonomic problems'. Annals of Eugenics. 7 (2): 179-188."
]
},
- "la-riots" : {
- "description" : "More than 60 people lost their lives amid the looting and fires that ravaged Los Angeles for five days starting on April 29, 1992. This dataset contains metadata about each person, including the geographic coordinates of their death. It was compiled and published by the Los Angeles Times Data Desk [1]_.",
- "references" : [
- "http://spreadsheets.latimes.com/la-riots-deaths/"
- ]
- },
"ohlc" : {
"description" : "This dataset contains the performance of the Chicago Board Options Exchange `Volatility Index <https://en.wikipedia.org/wiki/VIX>`_ in the summer of 2009."
},

View file

@ -2026,6 +2026,35 @@ (define-public r-xtable
"This package provides tools to export R data as LaTeX and HTML tables.") "This package provides tools to export R data as LaTeX and HTML tables.")
(license license:gpl2+))) (license license:gpl2+)))
;; Package definition for the vega_datasets Python library.
;;
;; The upstream "la-riots" dataset has an unclear license.  The code that
;; references it is removed by the patch, and the data file itself is removed
;; by the origin snippet.  Stripping the file in the origin (rather than in a
;; build phase) means the source returned by `guix build --source' does not
;; contain it either.
(define-public python-vega-datasets
  (package
    (name "python-vega-datasets")
    (version "0.9.0")
    (source
     (origin
       (method url-fetch)
       (uri (pypi-uri "vega_datasets" version))
       (sha256
        (base32 "1h1zv607mars2j73v8fdwihjh479blqxyw29nhmc73lf40s9iglx"))
       (patches
        (search-patches "python-vega-datasets-remove-la-riots-code.patch"))
       (modules '((guix build utils)))
       ;; Remove dataset with unclear license.  The path is relative to the
       ;; top of the unpacked source tree, where the snippet is evaluated.
       (snippet
        #~(delete-file "vega_datasets/_data/la-riots.csv"))))
    (build-system pyproject-build-system)
    (native-inputs (list python-pytest))
    (propagated-inputs (list python-pandas))
    (home-page "https://github.com/altair-viz/vega_datasets")
    (synopsis "Example datasets used by Vega-related projects")
    (description "This package provides a collection of datasets used in Vega
and Vega-Lite examples.")
    (license license:expat)))
(define-public python-hdmedians (define-public python-hdmedians
(package (package
(name "python-hdmedians") (name "python-hdmedians")