blob: 3c79cf61a16a54e2897c908ace177ea9ed1ff414 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
|
# Package expression for SoMaJo, built with buildPythonPackage from the
# upstream GitHub repository at the tag matching `version`.
{
  lib,
  stdenv,
  buildPythonPackage,
  fetchFromGitHub,
  setuptools,
  regex,
}:

buildPythonPackage rec {
  pname = "somajo";
  version = "2.4.3";
  pyproject = true;

  # Upstream source; the tag is derived from `version` ("v" prefix).
  src = fetchFromGitHub {
    owner = "tsproisl";
    repo = "SoMaJo";
    tag = "v${version}";
    hash = "sha256-fq891LX6PukUEfrXplulhnisuPX/RqLAQ/5ty/Fvm9k=";
  };

  # Build backend and runtime requirement, respectively.
  build-system = [ setuptools ];
  dependencies = [ regex ];

  # Module name handed to the Python imports check.
  pythonImportsCheck = [ "somajo" ];

  # Checks are switched off on Darwin hosts only: per the original note,
  # they loop forever there.
  # NOTE(review): no check hook / nativeCheckInputs is declared in this
  # expression - confirm which tests this flag actually gates.
  doCheck = !stdenv.hostPlatform.isDarwin;

  meta = {
    description = "Tokenizer and sentence splitter for German and English web texts";
    homepage = "https://github.com/tsproisl/SoMaJo";
    changelog = "https://github.com/tsproisl/SoMaJo/blob/v${version}/CHANGES.txt";
    license = lib.licenses.gpl3Plus;
    # Executable declared as the package's main program.
    mainProgram = "somajo-tokenizer";
    # Currently no listed maintainers.
    maintainers = [ ];
  };
}
|