summaryrefslogtreecommitdiff
path: root/pkgs/servers/sql/postgresql/ext/apache_datasketches.nix
blob: d215a5467bcff3404131741952404f015279ff8e (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
{
  boost186,
  fetchFromGitHub,
  fetchpatch,
  lib,
  postgresql,
  postgresqlBuildExtension,
  postgresqlTestExtension,
}:

let
  # Version of the PostgreSQL extension; reused as the upstream git tag of
  # `main_src` and inherited by the package itself.
  version = "1.7.0";

  # Source tree of the PostgreSQL extension. The explicit `name` fixes the name
  # of the fetched source, which the package's `sourceRoot` refers to.
  main_src = fetchFromGitHub {
    owner = "apache";
    repo = "datasketches-postgresql";
    tag = version;
    name = "datasketches-postgresql";
    hash = "sha256-W41uAs3W4V7c9O/wBw3rut65bcmY8EdQS1/tPszMGqA=";
  };

  # Source tree of the DataSketches C++ library, pinned to its own tag rather
  # than to `version`. Its `name` is used by the package's `prePatch` to locate
  # the unpacked directory.
  cpp_src = fetchFromGitHub {
    owner = "apache";
    repo = "datasketches-cpp";
    tag = "5.2.0";
    name = "datasketches-cpp";
    hash = "sha256-h4+cln01jqLV0EpIqScpCyw8jxZgoVtdfBEjdvyUuVk=";
  };
in

# Package definition of the extension. Both source trees are listed in `srcs`;
# the extension's tree is the source root and the C++ library is copied into it
# before the patches are applied.
postgresqlBuildExtension (finalAttrs: {
  inherit version;
  pname = "apache_datasketches";

  sourceRoot = main_src.name;

  srcs = [
    main_src
    cpp_src
  ];

  # fails to build with boost 1.87
  buildInputs = [ boost186 ];

  # Copy the C++ library sources next to the extension's own sources. This runs
  # before the patches below, which target the copied `datasketches-cpp/`
  # directory. `--no-preserve=mode` presumably keeps the copy writable so it
  # can be patched.
  prePatch = ''
    cp --no-preserve=mode -r ../${cpp_src.name} .
  '';

  patches = [
    # https://github.com/apache/datasketches-cpp/pull/500
    # The upstream commit is relative to the C++ library's repository root, so
    # its paths are re-rooted under `datasketches-cpp/`.
    (fetchpatch {
      url = "https://github.com/apache/datasketches-cpp/commit/639134f6e88483bd1bfca451cf09d243ade9bdd4.patch";
      extraPrefix = "datasketches-cpp/";
      stripLen = 1;
      hash = "sha256-6SYKy3NycYABnUCuLUXQz+mTx4VaeWMlHnJ6aM+sNt4=";
    })
  ];

  enableUpdateScript = false;

  # Test that creates the extension and calls `hll_sketch_build` /
  # `hll_sketch_to_string` on a single value.
  passthru.tests = {
    extension = postgresqlTestExtension {
      sql = ''
        CREATE EXTENSION datasketches;
        SELECT hll_sketch_to_string(hll_sketch_build(1));
      '';
      inherit (finalAttrs) finalPackage;
    };
  };

  meta = {
    homepage = "https://datasketches.apache.org/";
    description = "PostgreSQL extension providing approximate algorithms for distinct item counts, quantile estimation and frequent items detection";
    longDescription = ''
      apache_datasketches is an extension to support approximate algorithms on PostgreSQL. The implementation
      is based on the Apache Datasketches CPP library, and provides support for HyperLogLog,
      Compressed Probabilistic Counting, KLL, Frequent strings, and Theta sketches.
    '';
    license = lib.licenses.asl20;
    maintainers = [ lib.maintainers.mmusnjak ];
    # Supported on every platform the selected PostgreSQL supports.
    inherit (postgresql.meta) platforms;
  };
})