82 lines
1.8 KiB
Nix
82 lines
1.8 KiB
Nix
{
|
|
buildPythonPackage,
|
|
fetchPypi,
|
|
fetchpatch,
|
|
lib,
|
|
|
|
# build-system
|
|
cython,
|
|
pkg-config,
|
|
setuptools,
|
|
|
|
# native dependencies
|
|
leptonica,
|
|
tesseract4,
|
|
|
|
# dependencies
|
|
pillow,
|
|
|
|
# tests
|
|
unittestCheckHook,
|
|
}:
|
|
|
|
buildPythonPackage rec {
|
|
pname = "tesserocr";
|
|
version = "2.8.0";
|
|
format = "setuptools";
|
|
|
|
src = fetchPypi {
|
|
inherit pname version;
|
|
hash = "sha256-vlGNGxtf9UwRqtoeD9EpQlCepwWB4KizmipHOgstvTY=";
|
|
};
|
|
|
|
patches = [
|
|
# Fix a broken test. The issue has been reported upstream at
|
|
# https://github.com/sirfz/tesserocr/issues/363
|
|
# Check the status of the issue before removing this patch at the next
|
|
# update.
|
|
(fetchpatch {
|
|
url = "https://github.com/sirfz/tesserocr/commit/78d9e8187bd4d282d572bd5221db2c69e560e017.patch";
|
|
hash = "sha256-s51s9EIV9AZT6UoqwTuQ8lOjToqwIIUkDLjsvCsyYFU=";
|
|
})
|
|
];
|
|
|
|
# https://github.com/sirfz/tesserocr/issues/314
|
|
postPatch = ''
|
|
sed -i '/allheaders.h/a\ pass\n\ncdef extern from "leptonica/pix_internal.h" nogil:' tesserocr/tesseract.pxd
|
|
|
|
substituteInPlace setup.py \
|
|
--replace-fail "Cython>=0.23,<3.1.0" Cython
|
|
'';
|
|
|
|
build-system = [
|
|
cython
|
|
pkg-config
|
|
setuptools
|
|
];
|
|
|
|
buildInputs = [
|
|
leptonica
|
|
tesseract4
|
|
];
|
|
|
|
dependencies = [ pillow ];
|
|
|
|
pythonImportsCheck = [ "tesserocr" ];
|
|
|
|
nativeCheckInputs = [ unittestCheckHook ];
|
|
|
|
preCheck = ''
|
|
rm -rf tesserocr
|
|
'';
|
|
|
|
meta = {
|
|
changelog = "https://github.com/sirfz/tesserocr/releases/tag/v${version}";
|
|
description = "Simple, Pillow-friendly, wrapper around the tesseract-ocr API for Optical Character Recognition (OCR)";
|
|
homepage = "https://github.com/sirfz/tesserocr";
|
|
license = lib.licenses.mit;
|
|
maintainers = with lib.maintainers; [ mtrsk ];
|
|
platforms = lib.platforms.unix;
|
|
};
|
|
}
|