python312Packages.docling: 2.23.0 -> 2.25.1 (#386660)

authored by Yt and committed by GitHub af0c7c75 7768e6b9

+45 -26
+29 -21
pkgs/development/python-modules/docling-ibm-models/default.nix
··· 2 lib, 3 buildPythonPackage, 4 fetchFromGitHub, 5 poetry-core, 6 # dependencies 7 - torch, 8 - torchvision, 9 - transformers, 10 huggingface-hub, 11 jsonlines, 12 numpy, 13 opencv-python-headless, 14 pillow, 15 tqdm, 16 - safetensors, 17 pytestCheckHook, 18 }: 19 20 buildPythonPackage rec { 21 pname = "docling-ibm-models"; 22 - version = "3.3.2"; 23 pyproject = true; 24 25 src = fetchFromGitHub { 26 owner = "DS4SD"; 27 repo = "docling-ibm-models"; 28 tag = "v${version}"; 29 - hash = "sha256-8mqDgbTj5g6jXEumj16Me9NjHLCOdR+pXmAwn2dghfg="; 30 }; 31 32 build-system = [ ··· 34 ]; 35 36 dependencies = [ 37 - torch 38 - torchvision 39 - transformers 40 - numpy 41 jsonlines 42 pillow 43 tqdm 44 - opencv-python-headless 45 - huggingface-hub 46 - safetensors 47 ]; 48 49 pythonRelaxDeps = [ 50 - "pillow" 51 - "torchvision" 52 "transformers" 53 "numpy" 54 ]; ··· 58 ]; 59 60 nativeCheckInputs = [ 61 pytestCheckHook 62 ]; 63 64 - preCheck = '' 65 - export HOME="$TEMPDIR" 66 - ''; 67 - 68 disabledTests = [ 69 # Requires network access 70 - "test_layoutpredictor" 71 - "test_tf_predictor" 72 "test_code_formula_predictor" # huggingface_hub.errors.LocalEntryNotFoundError 73 "test_figure_classifier" # huggingface_hub.errors.LocalEntryNotFoundError 74 ]; 75 76 meta = {
··· 2 lib, 3 buildPythonPackage, 4 fetchFromGitHub, 5 + 6 + # build-system 7 poetry-core, 8 + 9 # dependencies 10 + docling-core, 11 huggingface-hub, 12 jsonlines, 13 numpy, 14 opencv-python-headless, 15 pillow, 16 + pydantic, 17 + safetensors, 18 + torch, 19 + torchvision, 20 tqdm, 21 + transformers, 22 + 23 + # tests 24 + datasets, 25 pytestCheckHook, 26 + writableTmpDirAsHomeHook, 27 }: 28 29 buildPythonPackage rec { 30 pname = "docling-ibm-models"; 31 + version = "3.4.1"; 32 pyproject = true; 33 34 src = fetchFromGitHub { 35 owner = "DS4SD"; 36 repo = "docling-ibm-models"; 37 tag = "v${version}"; 38 + hash = "sha256-IgKP+4en0N6xLBjzwmddDk8z5P3J1vo+UMW+65a01Ww="; 39 }; 40 41 build-system = [ ··· 43 ]; 44 45 dependencies = [ 46 + docling-core 47 + huggingface-hub 48 jsonlines 49 + numpy 50 + opencv-python-headless 51 pillow 52 + pydantic 53 + safetensors 54 + torch 55 + torchvision 56 tqdm 57 + transformers 58 ]; 59 60 pythonRelaxDeps = [ 61 "transformers" 62 "numpy" 63 ]; ··· 67 ]; 68 69 nativeCheckInputs = [ 70 + datasets 71 pytestCheckHook 72 + writableTmpDirAsHomeHook 73 ]; 74 75 disabledTests = [ 76 # Requires network access 77 "test_code_formula_predictor" # huggingface_hub.errors.LocalEntryNotFoundError 78 "test_figure_classifier" # huggingface_hub.errors.LocalEntryNotFoundError 79 + "test_layoutpredictor" 80 + "test_readingorder" 81 + "test_tf_predictor" 82 ]; 83 84 meta = {
+16 -5
pkgs/development/python-modules/docling/default.nix
··· 9 # dependencies 10 beautifulsoup4, 11 certifi, 12 - deepsearch-glm, 13 docling-core, 14 docling-ibm-models, 15 docling-parse, ··· 49 50 buildPythonPackage rec { 51 pname = "docling"; 52 - version = "2.23.0"; 53 pyproject = true; 54 55 src = fetchFromGitHub { 56 owner = "DS4SD"; 57 repo = "docling"; 58 tag = "v${version}"; 59 - hash = "sha256-ySywKaLxjtgQM7RtzJrxZDS3z8uMwAwPDYO51uKHT28="; 60 }; 61 62 build-system = [ ··· 66 dependencies = [ 67 beautifulsoup4 68 certifi 69 - deepsearch-glm 70 docling-core 71 docling-ibm-models 72 docling-parse ··· 133 "test_e2e_pdfs_conversions" # AssertionError: ## TableFormer: Table Structure Understanding with Transf 134 "test_e2e_conversions" # RuntimeError: Tesseract is not available 135 136 # huggingface_hub.errors.LocalEntryNotFoundError: An error happened 137 "test_cli_convert" 138 "test_code_and_formula_conversion" ··· 152 meta = { 153 description = "Get your documents ready for gen AI"; 154 homepage = "https://github.com/DS4SD/docling"; 155 - changelog = "https://github.com/DS4SD/docling/blob/${src.rev}/CHANGELOG.md"; 156 license = lib.licenses.mit; 157 maintainers = with lib.maintainers; [ happysalada ]; 158 mainProgram = "docling";
··· 9 # dependencies 10 beautifulsoup4, 11 certifi, 12 docling-core, 13 docling-ibm-models, 14 docling-parse, ··· 48 49 buildPythonPackage rec { 50 pname = "docling"; 51 + version = "2.25.1"; 52 pyproject = true; 53 54 src = fetchFromGitHub { 55 owner = "DS4SD"; 56 repo = "docling"; 57 tag = "v${version}"; 58 + hash = "sha256-uJZIwXVwGd9xDBQkZ/uz2XLJ+lL1ZAZHJv/jHtW/LCk="; 59 }; 60 61 build-system = [ ··· 65 dependencies = [ 66 beautifulsoup4 67 certifi 68 docling-core 69 docling-ibm-models 70 docling-parse ··· 131 "test_e2e_pdfs_conversions" # AssertionError: ## TableFormer: Table Structure Understanding with Transf 132 "test_e2e_conversions" # RuntimeError: Tesseract is not available 133 134 + # AssertionError 135 + # assert doc.export_to_markdown() == pair[1], f"Error in case {idx}" 136 + "test_ordered_lists" 137 + 138 + # AssertionError: export to md 139 + "test_e2e_html_conversions" 140 + 141 + # AssertionError: assert 'Unordered li...d code block:' == 'Unordered li...d code block:' 142 + "test_convert_valid" 143 + 144 + # AssertionError: Markdown file mismatch against groundtruth pftaps057006474.md 145 + "test_patent_groundtruth" 146 + 147 # huggingface_hub.errors.LocalEntryNotFoundError: An error happened 148 "test_cli_convert" 149 "test_code_and_formula_conversion" ··· 163 meta = { 164 description = "Get your documents ready for gen AI"; 165 homepage = "https://github.com/DS4SD/docling"; 166 + changelog = "https://github.com/DS4SD/docling/blob/v${version}/CHANGELOG.md"; 167 license = lib.licenses.mit; 168 maintainers = with lib.maintainers; [ happysalada ]; 169 mainProgram = "docling";