From 6d2fef9b79d2aa6b497fb52a0eb0d050fe471429 Mon Sep 17 00:00:00 2001 From: Martijn Visser Date: Fri, 15 Dec 2023 17:32:13 +0100 Subject: [PATCH 1/3] Fix and change table sorting in Python --- docs/core/usage.qmd | 34 ++++++++++++------------- python/ribasim/ribasim/config.py | 37 +++++++++++++++++++++++----- python/ribasim/ribasim/input_base.py | 6 ++++- 3 files changed, 53 insertions(+), 24 deletions(-) diff --git a/docs/core/usage.qmd b/docs/core/usage.qmd index 6cf12c20e..0fa1ba0d5 100644 --- a/docs/core/usage.qmd +++ b/docs/core/usage.qmd @@ -348,8 +348,8 @@ Lets a fraction (in [0,1]) of the incoming flow trough. column | type | unit | restriction ------------- | ------- | ------------ | ----------- node_id | Int | - | sorted +control_state | String | - | (optional) sorted per node_id fraction | Float64 | - | in the interval [0,1] -control_state | String | - | (optional) # TabulatedRatingCurve @@ -359,10 +359,10 @@ relation between the storage of a connected Basin (via the outlet level) and its column | type | unit | restriction ------------- | ------- | ------------ | ----------- node_id | Int | - | sorted +control_state | String | - | (optional) sorted per node_id active | Bool | - | (optional, default true) level | Float64 | $m$ | sorted per control_state discharge | Float64 | $m^3 s^{-1}$ | non-negative -control_state | String | - | (optional) sorted per node_id node_id | discharge | level ------- |----------- |------- @@ -382,8 +382,8 @@ Note that a `node_id` can be either in this table or in the static one, but not column | type | unit | restriction --------- | ------- | ------------ | ----------- -time | DateTime | - | sorted -node_id | Int | - | sorted per time +node_id | Int | - | sorted +time | DateTime | - | sorted per node_id level | Float64 | $m$ | - discharge | Float64 | $m^3 s^{-1}$ | non-negative @@ -398,11 +398,11 @@ When PID controlled, the pump must point away from the controlled basin in terms column | type | unit | restriction --------- | ------- | ------------ | ----------- node_id | Int | - | sorted +control_state | String | - | (optional) sorted per node_id active | Bool | - | (optional, default true) flow_rate | Float64 | $m^3 s^{-1}$ | non-negative min_flow_rate | Float64 | $m^3 s^{-1}$ | (optional, default 0.0) max_flow_rate | Float64 | $m^3 s^{-1}$ | (optional) -control_state | String | - | (optional) # Outlet @@ -412,12 +412,12 @@ When PID controlled, the outlet must point towards the controlled basin in terms column | type | unit | restriction --------- | ------- | ------------ | ----------- node_id | Int | - | sorted +control_state | String | - | (optional) sorted per node_id active | Bool | - | (optional, default true) flow_rate | Float64 | $m^3 s^{-1}$ | non-negative min_flow_rate | Float64 | $m^3 s^{-1}$ | (optional, default 0.0) max_flow_rate | Float64 | $m^3 s^{-1}$ | (optional) min_crest_level | Float64 | $m$ | (optional) -control_state | String | - | (optional) # User @@ -454,11 +454,11 @@ Note that a `node_id` can be either in this table or in the static one, but not column | type | unit | restriction ------------- | -------- | ------------ | ----------- node_id | Int | - | sorted +priority | Int | - | sorted per node id time | DateTime | - | sorted per priority per node id demand | Float64 | $m^3 s^{-1}$ | - return_factor | Float64 | - | between [0 - 1] min_level | Float64 | $m$ | (optional) -priority | Int | - | sorted per node id ## Allocation results @@ -503,8 +503,8 @@ Note that a `node_id` can be either in this table or in the static one, but not column | type | unit | restriction --------- | ------- | ------------ | ----------- -time | DateTime | - | sorted -node_id | Int | - | sorted per time +node_id | Int | - | sorted +time | DateTime | - | sorted per node_id level | Float64 | $m$ | - # FlowBoundary @@ -534,8 +534,8 @@ Note that a `node_id` can be either in this table or in the static one, but not column | type | unit | restriction --------- | ------- | ------------ | ----------- -time | DateTime | - | sorted -node_id | Int | - | sorted per time +node_id | Int | - | sorted +time | DateTime | - | sorted per node_id flow_rate | Float64 | $m^3 s^{-1}$ | non-negative # LinearResistance @@ -545,9 +545,9 @@ Flow proportional to the level difference between the connected basins. column | type | unit | restriction ------------- | ------- | ------------ | ----------- node_id | Int | - | sorted +control_state | String | - | (optional) sorted per node_id active | Bool | - | (optional, default true) resistance | Float64 | $sm^{-2}$ | - -control_state | String | - | (optional) # ManningResistance @@ -556,12 +556,12 @@ Flow through this connection is estimated by conservation of energy and the Mann column | type | unit | restriction ------------- | ------- | ------------ | ----------- node_id | Int | - | sorted +control_state | String | - | (optional) sorted per node_id active | Bool | - | (optional, default true) length | Float64 | $m$ | positive manning_n | Float64 | $s m^{-\frac{1}{3}}$ | positive profile_width | Float64 | $m$ | positive profile_slope | Float64 | - | - -control_state | String | - | (optional) # Terminal @@ -606,8 +606,8 @@ DiscreteControl is applied in the Julia core as follows: column | type | unit | restriction -------------- | -------- | ---- | ----------- node_id | Int | - | sorted +control_state | String | - | sorted per node_id truth_state | String | - | Consists of the characters "T" (true), "F" (false), "U" (upcrossing), "D" (downcrossing) and "*" (any) -control_state | String | - | ## DiscreteControl results @@ -631,13 +631,13 @@ In the future controlling the flow on a particular edge could be supported. column | type | unit | restriction -------------- | -------- | -------- | ----------- node_id | Int | - | sorted +control_state | String | - | (optional) sorted per node_id active | Bool | - | (optional, default true) listen_node_id | Int | - | - target | Float64 | $m$ | - proportional | Float64 | $s^{-1}$ | - integral | Float64 | $s^{-2}$ | - derivative | Float64 | - | - -control_state | String | - | - ## PidControl / time @@ -651,8 +651,8 @@ Note that a `node_id` can be either in this table or in the static one, but not column | type | unit | restriction -------------- | -------- | -------- | ----------- -node_id | Int | - | sorted per time -time | DateTime | - | sorted +node_id | Int | - | sorted +time | DateTime | - | sorted per node_id listen_node_id | Int | - | - target | Float64 | $m$ | - proportional | Float64 | $s^{-1}$ | - diff --git a/python/ribasim/ribasim/config.py b/python/ribasim/ribasim/config.py index ca8983d5f..6bcbf8035 100644 --- a/python/ribasim/ribasim/config.py +++ b/python/ribasim/ribasim/config.py @@ -82,6 +82,8 @@ class Terminal(NodeModel): default_factory=TableModel[TerminalStaticSchema] ) + _sort_keys: dict[str, list[str]] = {"static": ["node_id"]} + class PidControl(NodeModel): static: TableModel[PidControlStaticSchema] = Field( @@ -91,7 +93,10 @@ class PidControl(NodeModel): default_factory=TableModel[PidControlTimeSchema] ) - _sort_keys: dict[str, list[str]] = {"time": ["time", "node_id"]} + _sort_keys: dict[str, list[str]] = { + "static": ["node_id", "control_state"], + "time": ["node_id", "time"], + } class LevelBoundary(NodeModel): @@ -102,7 +107,10 @@ class LevelBoundary(NodeModel): default_factory=TableModel[LevelBoundaryTimeSchema] ) - _sort_keys: dict[str, list[str]] = {"time": ["time", "node_id"]} + _sort_keys: dict[str, list[str]] = { + "static": ["node_id"], + "time": ["node_id", "time"], + } class Pump(NodeModel): @@ -110,6 +118,8 @@ class Pump(NodeModel): default_factory=TableModel[PumpStaticSchema] ) + _sort_keys: dict[str, list[str]] = {"static": ["node_id", "control_state"]} + class TabulatedRatingCurve(NodeModel): static: TableModel[TabulatedRatingCurveStaticSchema] = Field( @@ -119,8 +129,8 @@ class TabulatedRatingCurve(NodeModel): default_factory=TableModel[TabulatedRatingCurveTimeSchema] ) _sort_keys: dict[str, list[str]] = { - "static": ["node_id", "level"], - "time": ["time", "node_id", "level"], + "static": ["node_id", "control_state", "level"], + "time": ["node_id", "time", "level"], } @@ -144,7 +154,10 @@ class FlowBoundary(NodeModel): default_factory=TableModel[FlowBoundaryTimeSchema] ) - _sort_keys: dict[str, list[str]] = {"time": ["time", "node_id"]} + _sort_keys: dict[str, list[str]] = { + "static": ["node_id"], + "time": ["node_id", "time"], + } class Basin(NodeModel): @@ -165,8 +178,9 @@ class Basin(NodeModel): ) _sort_keys: dict[str, list[str]] = { + "static": ["node_id"], "profile": ["node_id", "level"], - "time": ["time", "node_id"], + "time": ["node_id", "time"], "subgrid": ["subgrid_id", "basin_level"], } @@ -176,6 +190,8 @@ class ManningResistance(NodeModel): default_factory=TableModel[ManningResistanceStaticSchema] ) + _sort_keys: dict[str, list[str]] = {"static": ["node_id", "control_state"]} + class DiscreteControl(NodeModel): condition: TableModel[DiscreteControlConditionSchema] = Field( @@ -185,20 +201,29 @@ class DiscreteControl(NodeModel): default_factory=TableModel[DiscreteControlLogicSchema] ) + # TODO complete the ordering, and make sure it aligns with truth_state + _sort_keys: dict[str, list[str]] = {"static": ["node_id"], "logic": ["node_id"]} + class Outlet(NodeModel): static: TableModel[OutletStaticSchema] = Field( default_factory=TableModel[OutletStaticSchema] ) + _sort_keys: dict[str, list[str]] = {"static": ["node_id", "control_state"]} + class LinearResistance(NodeModel): static: TableModel[LinearResistanceStaticSchema] = Field( default_factory=TableModel[LinearResistanceStaticSchema] ) + _sort_keys: dict[str, list[str]] = {"static": ["node_id", "control_state"]} + class FractionalFlow(NodeModel): static: TableModel[FractionalFlowStaticSchema] = Field( default_factory=TableModel[FractionalFlowStaticSchema] ) + + _sort_keys: dict[str, list[str]] = {"static": ["node_id", "control_state"]} diff --git a/python/ribasim/ribasim/input_base.py b/python/ribasim/ribasim/input_base.py index 42958ab75..34073f3ce 100644 --- a/python/ribasim/ribasim/input_base.py +++ b/python/ribasim/ribasim/input_base.py @@ -393,6 +393,10 @@ def set_modeld( content = serializer(self) return dict(filter(lambda x: x[1], content.items())) + @classmethod + def sort_keys(cls, field: str) -> list[str]: + return cls._sort_keys[field] + @classmethod def get_input_type(cls): return cls.__name__ @@ -426,7 +430,7 @@ def _save(self, directory: DirectoryPath, input_dir: DirectoryPath, **kwargs): getattr(self, field)._save( directory, input_dir, - sort_keys=self._sort_keys.get("field", ["node_id"]), + sort_keys=self._sort_keys[field], ) def _repr_content(self) -> str: From 0c9e3f719a34e55ab746c5f6934887ff9fd69536 Mon Sep 17 00:00:00 2001 From: Martijn Visser Date: Tue, 9 Jan 2024 16:30:48 +0100 Subject: [PATCH 2/3] add DiscreteControl sorting, Basing / state sorting --- docs/core/usage.qmd | 14 +++++++------- python/ribasim/ribasim/config.py | 7 +++++-- 2 files changed, 12 insertions(+), 9 deletions(-) diff --git a/docs/core/usage.qmd b/docs/core/usage.qmd index 0fa1ba0d5..73bd3ca21 100644 --- a/docs/core/usage.qmd +++ b/docs/core/usage.qmd @@ -585,9 +585,9 @@ The condition schema defines conditions of the form 'the discrete_control node w column | type | unit | restriction ----------------- | -------- | ------- | ----------- node_id | Int | - | sorted -listen_feature_id | Int | - | - -variable | String | - | must be "level" or "flow_rate" -greater_than | Float64 | various | - +listen_feature_id | Int | - | sorted per node_id +variable | String | - | must be "level" or "flow_rate", sorted per listen_feature_id +greater_than | Float64 | various | sorted per variable look_ahead | Float64 | $s$ | Only on transient boundary conditions, non-negative (optional, default 0) ## DiscreteControl / logic @@ -596,8 +596,8 @@ The logic schema defines which control states are triggered based on the truth o DiscreteControl is applied in the Julia core as follows: - During the simulation it is checked whether the truth of any of the conditions changes. -- When a condition changes, the corresponding discrrete_control node id is retrieved (node_id in the condition schema above). -- The truth value of all the conditions this discrete_control node lisens to are retrieved, in the order as they are specified in the condition schema. This is then converted into a string of "T" for true and "F" for false. This string we call the truth state.* +- When a condition changes, the corresponding discrete_control node id is retrieved (node_id in the condition schema above). +- The truth value of all the conditions this discrete_control node listens to are retrieved, in the order as they are specified in the condition schema. This is then converted into a string of "T" for true and "F" for false. This string we call the truth state.* - The table below determines for the given discrete_control node ID and truth state what the corresponding control state is. - For all the nodes this discrete_control node affects (as given by the "control" edges in [Edges / static](usage.qmd#edge)), their parameters are set to those parameters in `NodeType / static` corresponding to the determined control state. @@ -606,8 +606,8 @@ DiscreteControl is applied in the Julia core as follows: column | type | unit | restriction -------------- | -------- | ---- | ----------- node_id | Int | - | sorted -control_state | String | - | sorted per node_id -truth_state | String | - | Consists of the characters "T" (true), "F" (false), "U" (upcrossing), "D" (downcrossing) and "*" (any) +control_state | String | - | - +truth_state | String | - | Consists of the characters "T" (true), "F" (false), "U" (upcrossing), "D" (downcrossing) and "*" (any), sorted per node_id ## DiscreteControl results diff --git a/python/ribasim/ribasim/config.py b/python/ribasim/ribasim/config.py index 6bcbf8035..e992e811b 100644 --- a/python/ribasim/ribasim/config.py +++ b/python/ribasim/ribasim/config.py @@ -179,6 +179,7 @@ class Basin(NodeModel): _sort_keys: dict[str, list[str]] = { "static": ["node_id"], + "state": ["node_id"], "profile": ["node_id", "level"], "time": ["node_id", "time"], "subgrid": ["subgrid_id", "basin_level"], @@ -201,8 +202,10 @@ class DiscreteControl(NodeModel): default_factory=TableModel[DiscreteControlLogicSchema] ) - # TODO complete the ordering, and make sure it aligns with truth_state - _sort_keys: dict[str, list[str]] = {"static": ["node_id"], "logic": ["node_id"]} + _sort_keys: dict[str, list[str]] = { + "condition": ["node_id", "listen_feature_id", "variable", "greater_than"], + "logic": ["node_id", "truth_state"], + } class Outlet(NodeModel): From d003971bcc79610eb4d4e5b17979d9563d305d1f Mon Sep 17 00:00:00 2001 From: Martijn Visser Date: Fri, 12 Jan 2024 16:26:50 +0100 Subject: [PATCH 3/3] add test --- python/ribasim/ribasim/input_base.py | 11 +++-------- python/ribasim/tests/conftest.py | 5 +++++ python/ribasim/tests/test_io.py | 23 +++++++++++++++++++++++ 3 files changed, 31 insertions(+), 8 deletions(-) diff --git a/python/ribasim/ribasim/input_base.py b/python/ribasim/ribasim/input_base.py index 9dc2ea0a3..1538bfafa 100644 --- a/python/ribasim/ribasim/input_base.py +++ b/python/ribasim/ribasim/input_base.py @@ -289,10 +289,9 @@ def _from_arrow(cls, path: FilePath) -> pd.DataFrame: directory = context_file_loading.get().get("directory", Path(".")) return pd.read_feather(directory / path) - def sort(self, sort_keys: list[str] = ["node_id"]): - """Sort all input tables as required. + def sort(self, sort_keys: list[str]): + """Sort the table as required. - Tables are sorted by "node_id", unless otherwise specified. Sorting is done automatically before writing the table. """ if self.df is not None: @@ -375,7 +374,7 @@ def _write_table(self, path: FilePath) -> None: gdf.to_file(path, layer=self.tablename(), driver="GPKG") - def sort(self, sort_keys: list[str] = ["node_id"]): + def sort(self, sort_keys: list[str]): self.df.sort_index(inplace=True) @@ -402,10 +401,6 @@ def set_modeld( content = serializer(self) return dict(filter(lambda x: x[1], content.items())) - @classmethod - def sort_keys(cls, field: str) -> list[str]: - return cls._sort_keys[field] - @classmethod def get_input_type(cls): return cls.__name__ diff --git a/python/ribasim/tests/conftest.py b/python/ribasim/tests/conftest.py index 4e4c1d09f..f6dbb730d 100644 --- a/python/ribasim/tests/conftest.py +++ b/python/ribasim/tests/conftest.py @@ -32,3 +32,8 @@ def backwater() -> ribasim.Model: @pytest.fixture() def discrete_control_of_pid_control() -> ribasim.Model: return ribasim_testmodels.discrete_control_of_pid_control_model() + + +@pytest.fixture() +def level_setpoint_with_minmax() -> ribasim.Model: + return ribasim_testmodels.level_setpoint_with_minmax_model() diff --git a/python/ribasim/tests/test_io.py b/python/ribasim/tests/test_io.py index 888c692f8..b1ac52056 100644 --- a/python/ribasim/tests/test_io.py +++ b/python/ribasim/tests/test_io.py @@ -102,3 +102,26 @@ def test_extra_columns(basic_transient): node = Node(df=df) assert "meta_node_id" in node.df.columns + + +def test_sort(level_setpoint_with_minmax, tmp_path): + model = level_setpoint_with_minmax + table = model.discrete_control.condition + + # apply a wrong sort, then call the sort method to restore order + table.df.sort_values("greater_than", ascending=False, inplace=True) + assert table.df.iloc[0]["greater_than"] == 15.0 + sort_keys = model.discrete_control._sort_keys["condition"] + assert sort_keys == ["node_id", "listen_feature_id", "variable", "greater_than"] + table.sort(sort_keys) + assert table.df.iloc[0]["greater_than"] == 5.0 + + # re-apply wrong sort, then check if it gets sorted on write + table.df.sort_values("greater_than", ascending=False, inplace=True) + model.write(tmp_path / "basic/ribasim.toml") + # write sorts the model in place + assert table.df.iloc[0]["greater_than"] == 5.0 + model_loaded = ribasim.Model(filepath=tmp_path / "basic/ribasim.toml") + table_loaded = model_loaded.discrete_control.condition + assert table_loaded.df.iloc[0]["greater_than"] == 5.0 + __assert_equal(table.df, table_loaded.df)