27 tensorflow-probability,
33 bsuite = buildPythonPackage rec {
38 disabled = pythonOlder "3.7";
41 inherit pname version;
42 hash = "sha256-ak9McvXl7Nz5toUaPaRaJek9lurxiQiIW209GnZEjX0=";
46 # Convert np.int -> np.int32 since np.int is deprecated, https://github.com/google-deepmind/bsuite/pull/48
48 url = "https://github.com/google-deepmind/bsuite/pull/48/commits/f8d81b2f1c27ef2c8c71ae286001ed879ea306ab.patch";
49 hash = "sha256-FXtvVS+U8brulq8Z27+yWIimB+kigGiUOIv1SHb1TA8=";
51 # Replace imp with importlib, https://github.com/google-deepmind/bsuite/pull/50
53 name = "replace-imp.patch";
54 url = "https://github.com/google-deepmind/bsuite/commit/d08b63655c7efa5b5bb0f35e825e17549d23e812.patch";
55 hash = "sha256-V5p/6edNXTpEckuSuxJ/mvfJng5yE/pfeMoYbvlNpEo=";
59 build-system = [ setuptools ];
85 tensorflow-probability
89 pythonImportsCheck = [ "bsuite" ];
92 # Tests require network connection
94 "test_longer_action_sequence"
96 "test_step_after_reset"
97 "test_step_on_fresh_environment"
98 "test_longer_action_sequence"
100 "test_step_after_reset"
101 "test_step_on_fresh_environment"
102 "test_longer_action_sequence"
104 "test_step_after_reset"
105 "test_step_on_fresh_environment"
107 "test_episode_truncation"
110 # Escape infinite recursion with rlax
114 check = bsuite.overridePythonAttrs (_: {
120 description = "Collection of experiments that investigate core capabilities of a reinforcement learning (RL) agent";
121 homepage = "https://github.com/deepmind/bsuite";
122 changelog = "https://github.com/google-deepmind/bsuite/releases/tag/${version}";
123 license = licenses.asl20;
124 maintainers = with maintainers; [ onny ];