summaryrefslogtreecommitdiff
path: root/pkgs/development/python-modules/cltk/default.nix
blob: 398ed15ca387c1cc9cec129fd7ad6aebb8d285a6 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
{
  lib,
  buildPythonPackage,
  fetchFromGitHub,

  # build-system
  poetry-core,

  # dependencies
  boltons,
  gensim,
  gitpython,
  greek-accentuation,
  nltk,
  pyyaml,
  rapidfuzz,
  requests,
  scikit-learn,
  scipy,
  spacy,
  stanza,
  torch,
  tqdm,
  colorama,
  python-dotenv,

  # tests
  pytestCheckHook,
  writableTmpDirAsHomeHook,
}:

# Package definition for cltk, built from the tagged GitHub release with a
# pyproject-based build (poetry-core as the build backend).
buildPythonPackage rec {
  pname = "cltk";
  version = "2.0.4";
  pyproject = true;

  # Source is fetched from the upstream repository at the tag "v<version>".
  src = fetchFromGitHub {
    owner = "cltk";
    repo = "cltk";
    tag = "v${version}";
    hash = "sha256-tAomXxI6XsIAxQzPiUsT5t1CHrFDPkwyWtVuHXQCz2A=";
  };

  build-system = [ poetry-core ];

  # Runtime dependencies; list order is kept exactly as declared upstream here.
  dependencies = [
    boltons
    gensim
    gitpython
    greek-accentuation
    nltk
    pyyaml
    rapidfuzz
    requests
    scikit-learn
    scipy
    spacy
    stanza
    torch
    tqdm
    colorama
    python-dotenv
  ];

  # NOTE(review): presumably relaxes the version constraint that upstream
  # places on spacy so the packaged spacy is accepted - confirm against
  # upstream's pyproject.toml.
  pythonRelaxDeps = [ "spacy" ];

  # The test suite is disabled: most tests need local data files and
  # internet access, neither of which is available during the build.
  doCheck = false;

  # Test tooling is still declared even though doCheck is false above.
  nativeCheckInputs = [
    pytestCheckHook
    writableTmpDirAsHomeHook
  ];

  meta = {
    description = "Natural language processing (NLP) framework for pre-modern languages";
    homepage = "https://cltk.org";
    changelog = "https://github.com/cltk/cltk/releases/tag/v${version}";
    license = lib.licenses.mit;
    maintainers = [ lib.maintainers.kmein ];
  };
}