1{ lib
2, buildPythonPackage
3, distro
4, fetchFromGitHub
5, jdk
6, numpy
7, pandas
8, pytestCheckHook
9, pythonOlder
10, setuptools-scm
11}:
12
13buildPythonPackage rec {
14 pname = "tabula-py";
15 version = "2.5.1";
16 format = "setuptools";
17
18 disabled = pythonOlder "3.7";
19
20 src = fetchFromGitHub {
21 owner = "chezou";
22 repo = pname;
23 rev = "v${version}";
24 hash = "sha256-Dfi6LzrLDz9VVDmbeK1dEaWuQosD4tvAH13Q4Mp3smA=";
25 };
26
27 SETUPTOOLS_SCM_PRETEND_VERSION = version;
28
29 nativeBuildInputs = [
30 setuptools-scm
31 ];
32
33 propagatedBuildInputs = [
34 distro
35 numpy
36 pandas
37 ];
38
39 checkInputs = [
40 jdk
41 pytestCheckHook
42 ];
43
44 pythonImportsCheck = [
45 "tabula"
46 ];
47
48 disabledTests = [
49 # Tests require network access
50 "test_convert_remote_file"
51 "test_read_pdf_with_remote_template"
52 "test_read_remote_pdf"
53 "test_read_remote_pdf_with_custom_user_agent"
54 ];
55
56 meta = with lib; {
57 description = "Module to extract table from PDF into pandas DataFrame";
58 homepage = "https://github.com/chezou/tabula-py";
59 license = licenses.mit;
60 maintainers = with maintainers; [ fab ];
61 };
62}