summaryrefslogtreecommitdiff
path: root/pkgs/development/python-modules/hdbscan/default.nix
blob: 0312436eaf95b1cc7656fe0a5ae5eed4cf9e5e55 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
{
  lib,
  buildPythonPackage,
  fetchFromGitHub,
  fetchpatch,

  cython,
  numpy,
  scipy,
  scikit-learn,
  joblib,
  six,

  # test
  pytestCheckHook,
}:

buildPythonPackage rec {
  pname = "hdbscan";
  version = "0.8.40";
  format = "setuptools";

  src = fetchFromGitHub {
    owner = "scikit-learn-contrib";
    repo = "hdbscan";
    tag = "release-${version}";
    hash = "sha256-xsBlmSQU47e+M+nRqUXdWKS7Rtj2QZ1UWLAvjSQOJ0Q=";
  };

  patches = [
    (fetchpatch {
      # Replace obsolete use of assert_raises with pytest.raises
      name = "replace-assert_raises";
      url = "https://github.com/scikit-learn-contrib/hdbscan/pull/667/commits/04d6a4dcdcd2bb2597419b8aa981d7620765809f.patch";
      hash = "sha256-z/u5b2rNPKOCe+3/GVE8rMB5ajeU5PrvLVesjEgj9TA=";
    })
  ];

  pythonRemoveDeps = [ "cython" ];

  nativeBuildInputs = [
    cython
    joblib
    numpy
    scikit-learn
    scipy
    six
  ];

  preCheck = ''
    cd hdbscan/tests
    rm __init__.py
  '';

  nativeCheckInputs = [ pytestCheckHook ];

  disabledTests = [
    # known flaky tests: https://github.com/scikit-learn-contrib/hdbscan/issues/420
    "test_mem_vec_diff_clusters"
    "test_all_points_mem_vec_diff_clusters"
    "test_approx_predict_diff_clusters"
    # another flaky test https://github.com/scikit-learn-contrib/hdbscan/issues/421
    "test_hdbscan_boruvka_balltree_matches"
    # more flaky tests https://github.com/scikit-learn-contrib/hdbscan/issues/570
    "test_hdbscan_boruvka_balltree"
    "test_hdbscan_best_balltree_metric"
    # "got an unexpected keyword argument"
    "test_hdbscan_badargs"
  ];

  disabledTestPaths = [
    # joblib.externals.loky.process_executor.BrokenProcessPool:
    "test_branches.py"
  ];

  pythonImportsCheck = [ "hdbscan" ];

  meta = {
    description = "Hierarchical Density-Based Spatial Clustering of Applications with Noise, a clustering algorithm with a scikit-learn compatible API";
    homepage = "https://github.com/scikit-learn-contrib/hdbscan";
    changelog = "https://github.com/scikit-learn-contrib/hdbscan/releases/tag/release-${version}";
    license = lib.licenses.bsd3;
    maintainers = [ ];
  };
}