summary refs log tree commit diff
path: root/pkgs
diff options
context:
space:
mode:
author Maximilian Bosch <maximilian@mbosch.me> 2018-11-16 18:44:07 +0100
committer Frederik Rietdijk <freddyrietdijk@fridh.nl> 2018-11-22 12:22:08 +0100
commit 76ad975840904c509df250d38b131ef7b052eba2 (patch)
tree 2b072b135d635fd91853376540b16964e18ab311 /pkgs
parent 609316716483bb52489bc9a616da6d5afc0509eb (diff)
download nixpkgs-76ad975840904c509df250d38b131ef7b052eba2.tar
nixpkgs-76ad975840904c509df250d38b131ef7b052eba2.tar.gz
nixpkgs-76ad975840904c509df250d38b131ef7b052eba2.tar.bz2
nixpkgs-76ad975840904c509df250d38b131ef7b052eba2.tar.lz
nixpkgs-76ad975840904c509df250d38b131ef7b052eba2.tar.xz
nixpkgs-76ad975840904c509df250d38b131ef7b052eba2.tar.zst
nixpkgs-76ad975840904c509df250d38b131ef7b052eba2.zip
pythonPackages.pytesseract: init at 0.2.5
Simple python wrapper for Tesseract, an OCR engine to detect and read
text from images.

See https://pypi.org/project/pytesseract/
Diffstat (limited to 'pkgs')
-rw-r--r-- pkgs/development/python-modules/pytesseract/default.nix 31
-rw-r--r-- pkgs/development/python-modules/pytesseract/tesseract-binary.patch 13
-rw-r--r-- pkgs/top-level/python-packages.nix 2
3 files changed, 46 insertions, 0 deletions
diff --git a/pkgs/development/python-modules/pytesseract/default.nix b/pkgs/development/python-modules/pytesseract/default.nix
new file mode 100644
index 00000000000..7d96f4d39bd
--- /dev/null
+++ b/pkgs/development/python-modules/pytesseract/default.nix
@@ -0,0 +1,31 @@
+{ buildPythonPackage, fetchPypi, lib, pillow, tesseract, substituteAll }:
+
+buildPythonPackage rec {
+  pname = "pytesseract";
+  version = "0.2.5";
+
+  src = fetchPypi {
+    inherit pname version;
+    sha256 = "0wlz1vbg1k8cdrpzvrahjnbsfs4ki6xqhbkv17ycfchh7h6kfkfm";
+  };
+
+  patches = [
+    (substituteAll {
+      src = ./tesseract-binary.patch;
+      drv = "${tesseract}";
+    })
+  ];
+
+  buildInputs = [ tesseract ];
+  propagatedBuildInputs = [ pillow ];
+
+  # the package doesn't have any tests.
+  doCheck = false;
+
+  meta = with lib; {
+    homepage = https://pypi.org/project/pytesseract/;
+    license = licenses.gpl3;
+    description = "A Python wrapper for Google Tesseract";
+    maintainers = with maintainers; [ ma27 ];
+  };
+}
diff --git a/pkgs/development/python-modules/pytesseract/tesseract-binary.patch b/pkgs/development/python-modules/pytesseract/tesseract-binary.patch
new file mode 100644
index 00000000000..f7eb9fb1d42
--- /dev/null
+++ b/pkgs/development/python-modules/pytesseract/tesseract-binary.patch
@@ -0,0 +1,13 @@
+diff --git a/src/pytesseract.py b/src/pytesseract.py
+index 32713cf..5f9209d 100755
+--- a/src/pytesseract.py
++++ b/src/pytesseract.py
+@@ -25,7 +25,7 @@ if numpy_installed:
+     from numpy import ndarray
+ 
+ # CHANGE THIS IF TESSERACT IS NOT IN YOUR PATH, OR IS NAMED DIFFERENTLY
+-tesseract_cmd = 'tesseract'
++tesseract_cmd = '@drv@/bin/tesseract'
+ RGB_MODE = 'RGB'
+ OSD_KEYS = {
+     'Page number': ('page_num', int),
diff --git a/pkgs/top-level/python-packages.nix b/pkgs/top-level/python-packages.nix
index 726c6f3b58b..f1f3021d79b 100644
--- a/pkgs/top-level/python-packages.nix
+++ b/pkgs/top-level/python-packages.nix
@@ -609,6 +609,8 @@ in {
 
   pystache = callPackage ../development/python-modules/pystache { };
 
+  pytesseract = callPackage ../development/python-modules/pytesseract { };
+
   pytest-tornado = callPackage ../development/python-modules/pytest-tornado { };
 
   python-binance = callPackage ../development/python-modules/python-binance { };