20 testNltkData = symlinkJoin {
21 name = "nltk-test-data";
28 buildPythonPackage rec {
29 pname = "dataprep-ml";
33 disabled = pythonOlder "3.8";
35 # Fetch from PyPI because the GitHub repo has no tags or release branches
37 pname = "dataprep_ml";
39 hash = "sha256-pZhHlNcQJLBww7ur2Z6Yb2IdbRsBtjzQAzfa4UzGKt4=";
42 pythonRelaxDeps = [ "pydantic" ];
48 propagatedBuildInputs = [
60 # PyPI tarball has no tests
63 # Importing the package requires NLTK data to be available.
64 # Setting NLTK_DATA through `env` is the only way to make the variable
65 # visible to pythonImportsCheck.
66 env.NLTK_DATA = testNltkData;
67 pythonImportsCheck = [
69 "dataprep_ml.cleaners"
71 "dataprep_ml.imputers"
72 "dataprep_ml.insights"
73 "dataprep_ml.recommenders"
74 "dataprep_ml.splitters"
78 description = "Data utilities for Machine Learning pipelines";
79 homepage = "https://github.com/mindsdb/dataprep_ml";
80 license = licenses.gpl3Only;
81 maintainers = with maintainers; [ mbalatsko ];