summary refs log tree commit diff
path: root/pkgs/development/python-modules/datasets/default.nix
diff options
context:
space:
mode:
authorDaniël de Kok <me@danieldk.eu>2020-09-10 20:18:22 +0200
committerJon <jonringer@users.noreply.github.com>2020-09-10 16:06:40 -0700
commit1839c5cd7b85a5b5bc4586d9bc0b1d9439d34b81 (patch)
tree48338d46621cbdd060ee4a8a575144800e426b0f /pkgs/development/python-modules/datasets/default.nix
parent9627ae4f9a9ac84268fc46337a3069df4215a0df (diff)
downloadnixpkgs-1839c5cd7b85a5b5bc4586d9bc0b1d9439d34b81.tar
nixpkgs-1839c5cd7b85a5b5bc4586d9bc0b1d9439d34b81.tar.gz
nixpkgs-1839c5cd7b85a5b5bc4586d9bc0b1d9439d34b81.tar.bz2
nixpkgs-1839c5cd7b85a5b5bc4586d9bc0b1d9439d34b81.tar.lz
nixpkgs-1839c5cd7b85a5b5bc4586d9bc0b1d9439d34b81.tar.xz
nixpkgs-1839c5cd7b85a5b5bc4586d9bc0b1d9439d34b81.tar.zst
nixpkgs-1839c5cd7b85a5b5bc4586d9bc0b1d9439d34b81.zip
python3Packages.datasets: init at 1.0.0
This library provides open-access datasets and evaluation metrics for
natural language processing using PyTorch, TensorFlow, NumPy, and
Pandas.
Diffstat (limited to 'pkgs/development/python-modules/datasets/default.nix')
-rw-r--r--pkgs/development/python-modules/datasets/default.nix52
1 files changed, 52 insertions, 0 deletions
diff --git a/pkgs/development/python-modules/datasets/default.nix b/pkgs/development/python-modules/datasets/default.nix
new file mode 100644
index 00000000000..4bddd69ed99
--- /dev/null
+++ b/pkgs/development/python-modules/datasets/default.nix
@@ -0,0 +1,52 @@
+{ lib
+, buildPythonPackage
+, fetchFromGitHub
+, dill
+, filelock
+, numpy
+, pandas
+, pyarrow
+, requests
+, tqdm
+, xxhash
+}:
+
+buildPythonPackage rec {
+  pname = "datasets";
+  version = "1.0.0";
+
+  src = fetchFromGitHub {
+    owner = "huggingface";
+    repo = pname;
+    rev = version;
+    sha256 = "13l52r7nhj2c1a10isy5309d2g6pmaivyqs5w6yjbjj4195jxya5";
+  };
+
+  propagatedBuildInputs = [
+    dill
+    filelock
+    numpy
+    pandas
+    pyarrow
+    requests
+    tqdm
+    xxhash
+  ];
+
+  # Tests require pervasive internet access.
+  doCheck = false;
+
+  # Module import will attempt to create a cache directory.
+  postFixup = "export HF_MODULES_CACHE=$TMPDIR";
+
+  pythonImportsCheck = [ "datasets" ];
+
+  meta = with lib; {
+    homepage = "https://github.com/huggingface/datasets";
+    description = "Fast, efficient, open-access datasets and evaluation metrics for natural language processing";
+    changelog = "https://github.com/huggingface/datasets/releases/tag/${version}";
+    license = licenses.asl20;
+    platforms = platforms.unix;
+    maintainers = with maintainers; [ danieldk ];
+  };
+}