1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
|
# Package expression for docling-jobkit: a function from its inputs to a
# buildPythonPackage derivation built from the upstream GitHub tag.
{
  lib,
  stdenv,
  buildPythonPackage,
  fetchFromGitHub,

  # build-system
  hatchling,
  poetry-core,

  # dependencies
  docling,
  pydantic-settings,
  typer,
  boto3,
  pandas,
  fastparquet,
  pyarrow,
  httpx,

  # optional dependencies
  ray,
  rq,
  msgpack,

  # tests
  pytestCheckHook,
  pytest-asyncio,
  writableTmpDirAsHomeHook,
}:

let
  # Skipped on every platform: requires network access
  networkTests = [
    "test_chunk_file"
    "test_convert_file"
    "test_convert_warmup"
    "test_convert_url"
    "test_replicated_convert"
  ];

  # Skipped on Darwin only.
  # Flaky due to comparison with magic object
  # https://github.com/docling-project/docling-jobkit/issues/45
  darwinFlakyTests = [
    "test_options_validator"
  ];
in
buildPythonPackage rec {
  pname = "docling-jobkit";
  version = "1.5.0";
  pyproject = true;

  # Source is pinned to the release tag derived from `version`.
  src = fetchFromGitHub {
    owner = "docling-project";
    repo = "docling-jobkit";
    tag = "v${version}";
    hash = "sha256-/rFMP5KiWHBsGaA2LVOWP2TkJLVeguIlrmO+JL610hQ=";
  };

  build-system = [
    hatchling
    poetry-core
  ];

  dependencies = [
    docling
    pydantic-settings
    typer
    boto3
    pandas
    fastparquet
    pyarrow
    httpx
  ];

  # Extras; the `rq` group is also appended to the check inputs below.
  optional-dependencies = {
    ray = [ ray ];
    rq = [
      rq
      msgpack
    ];
  };

  # Dependencies whose version constraints are relaxed for this build.
  pythonRelaxDeps = [
    "boto3"
    "pandas"
    "pyarrow"
  ];

  # Modules that must be importable once the package is built.
  pythonImportsCheck = [
    "docling"
    "docling_jobkit"
  ];

  nativeCheckInputs = [
    pytestCheckHook
    pytest-asyncio
    writableTmpDirAsHomeHook
  ]
  ++ optional-dependencies.rq;

  # Network-dependent tests are always excluded; the flaky one only on Darwin.
  disabledTests = networkTests ++ lib.optionals stdenv.hostPlatform.isDarwin darwinFlakyTests;

  meta = {
    changelog = "https://github.com/docling-project/docling-jobkit/blob/${src.tag}/CHANGELOG.md";
    description = "Running a distributed job processing documents with Docling";
    homepage = "https://github.com/docling-project/docling-jobkit";
    license = lib.licenses.mit;
    maintainers = [ lib.maintainers.codgician ];
  };
}
|