5 # propagated build inputs
24 # optional-dependencies
30 unstructured-inference,
40 google-api-python-client,
61 optional-dependencies = {
69 local-inference = [ unstructured-inference ];
78 discord = [ ]; # discord-py
79 github = [ pygithub ];
80 gitlab = [ python-gitlab ];
82 slack = [ slack-sdk ];
83 wikipedia = [ wikipedia ];
84 google-drive = [ google-api-python-client ];
85 gcs = [ ]; # gcsfs fsspec
90 dropbox = [ ]; # dropboxdrivefs fsspec
91 confluence = [ atlassian-python-api ];
95 pname = "unstructured";
97 format = "setuptools";
99 src = fetchFromGitHub {
100 owner = "Unstructured-IO";
101 repo = "unstructured";
102 rev = "refs/tags/${version}";
103 hash = "sha256-cIMKaSKG4T832rpiJeiwftqVrcMezD9ICfislGPV/TQ=";
106 propagatedBuildInputs = [
127 pythonImportsCheck = [ "unstructured" ];
129 # the tests try to download the punkt tokenizer data from nltk
130 # TODO: figure out how to make it available so the tests can be enabled
133 nativeCheckInputs = [
146 optional-dependencies = optional-dependencies;
149 description = "Open source libraries and APIs to build custom preprocessing pipelines for labeling, training, or production machine learning pipelines";
150 mainProgram = "unstructured-ingest";
151 homepage = "https://github.com/Unstructured-IO/unstructured";
152 changelog = "https://github.com/Unstructured-IO/unstructured/blob/${version}/CHANGELOG.md";
153 license = licenses.asl20;
154 maintainers = with maintainers; [ happysalada ];