# Package expression for the Python package "somajo", built from the upstream
# GitHub sources with buildPythonPackage.
#
# Arguments are supplied by the caller (normally callPackage):
#   lib, stdenv          - library helpers and platform information
#   fetchFromGitHub      - source fetcher
#   buildPythonPackage   - Python package builder
#   pythonOlder          - interpreter version predicate
#   setuptools, regex    - build-time and runtime Python dependencies
{
  lib,
  stdenv,
  fetchFromGitHub,
  buildPythonPackage,
  pythonOlder,
  setuptools,
  regex,
}:

buildPythonPackage rec {
  pname = "somajo";
  version = "2.3.1";
  pyproject = true;

  # Not built for Python interpreters older than 3.7.
  disabled = pythonOlder "3.7";

  src = fetchFromGitHub {
    owner = "tsproisl";
    repo = "SoMaJo";
    # The "v" prefix is part of the tag name interpolated from `version`.
    rev = "refs/tags/v${version}";
    hash = "sha256-3A2et4pl92LsRtEx2Ki8Soz3n1nZEGQGPc3ZIBDojNM=";
  };

  nativeBuildInputs = [
    setuptools
  ];

  propagatedBuildInputs = [
    regex
  ];

  # The test suite loops forever on Darwin, so checks only run elsewhere.
  doCheck = !stdenv.hostPlatform.isDarwin;

  pythonImportsCheck = [
    "somajo"
  ];

  meta = {
    description = "Tokenizer and sentence splitter for German and English web texts";
    homepage = "https://github.com/tsproisl/SoMaJo";
    license = lib.licenses.gpl3Plus;
    maintainers = [ ];
  };
}