Skip to content

Commit

Permalink
Move incoming and outgoing flow computation to DuckDB
Browse files Browse the repository at this point in the history
Related to #895
  • Loading branch information
abelsiqueira committed Nov 4, 2024
1 parent f27f85e commit 64be059
Show file tree
Hide file tree
Showing 4 changed files with 162 additions and 13 deletions.
3 changes: 3 additions & 0 deletions src/create-model.jl
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@ function create_model!(energy_problem; kwargs...)
dataframes = energy_problem.dataframes
sets = create_sets(graph, years)
energy_problem.model = @timeit to "create_model" create_model(
energy_problem.db_connection,
graph,
sets,
variables,
Expand Down Expand Up @@ -44,6 +45,7 @@ end
Create the energy model given the `graph`, `representative_periods`, dictionary of `dataframes` (created by [`construct_dataframes`](@ref)), timeframe, and groups.
"""
function create_model(
connection,
graph,
sets,
variables,
Expand Down Expand Up @@ -115,6 +117,7 @@ function create_model(
incoming_flow_storage_inter_rp_balance,
outgoing_flow_storage_inter_rp_balance,
) = add_expressions_to_dataframe!(
connection,
dataframes,
variables,
model,
Expand Down
57 changes: 46 additions & 11 deletions src/model-preparation.jl
Original file line number Diff line number Diff line change
Expand Up @@ -62,8 +62,14 @@ function construct_dataframes(

tmp_create_constraints_indices(connection)

# WIP: Can these queries be left undordered by the end of the refactor?
# WIP: highest_in_out is not included in constraints_partition anymore
dataframes[:highest_in_out] = TulipaIO.get_table(connection, "cons_indices_highest_in_out")
dataframes[:highest_in_out] =
DuckDB.query(
connection,
"SELECT * FROM cons_indices_highest_in_out
ORDER BY asset, year, rep_period, time_block_start",
) |> DataFrame
dataframes[:highest_in_out].timesteps_block = map(
r -> r[1]:r[2],
zip(
Expand All @@ -74,7 +80,12 @@ function construct_dataframes(
dataframes[:highest_in_out].index = 1:size(dataframes[:highest_in_out], 1)

# WIP: highest_in is not included in constraints_partition anymore
dataframes[:highest_in] = TulipaIO.get_table(connection, "cons_indices_highest_in")
dataframes[:highest_in] =
DuckDB.query(
connection,
"SELECT * FROM cons_indices_highest_in
ORDER BY asset, year, rep_period, time_block_start",
) |> DataFrame
dataframes[:highest_in].timesteps_block = map(
r -> r[1]:r[2],
zip(dataframes[:highest_in].time_block_start, dataframes[:highest_in].time_block_end),
Expand Down Expand Up @@ -479,6 +490,7 @@ function add_expression_terms_inter_rp_constraints!(
end

function add_expressions_to_dataframe!(
connection,
dataframes,
variables,
model,
Expand Down Expand Up @@ -511,15 +523,38 @@ function add_expressions_to_dataframe!(
use_highest_resolution = false,
multiply_by_duration = true,
)
add_expression_terms_intra_rp_constraints!(
dataframes[:highest_in_out],
dataframes[:flows],
expression_workspace,
representative_periods,
graph;
use_highest_resolution = true,
multiply_by_duration = false,
)
# WIP: Changing the function below
# add_expression_terms_intra_rp_constraints!(
# dataframes[:highest_in_out],
# dataframes[:flows],
# expression_workspace,
# representative_periods,
# graph;
# use_highest_resolution = true,
# multiply_by_duration = false,
# )
dataframes[:highest_in_out].incoming_flow = JuMP.AffExpr[
if length(row.indices) > 0
sum(unique(variables[:flow].container[row.indices]))
else
JuMP.AffExpr(0.0)
end for row in DuckDB.query(
connection,
"SELECT * FROM highest_in_out_incoming
ORDER BY asset, year, rep_period, time_block_start",
)
]
dataframes[:highest_in_out].outgoing_flow = JuMP.AffExpr[
if length(row.indices) > 0
sum(unique(variables[:flow].container[row.indices]))
else
JuMP.AffExpr(0.0)
end for row in DuckDB.query(
connection,
"SELECT * FROM highest_in_out_outgoing
ORDER BY asset, year, rep_period, time_block_start",
)
]
add_expression_terms_intra_rp_constraints!(
dataframes[:highest_in],
dataframes[:flows],
Expand Down
114 changes: 112 additions & 2 deletions src/tmp.jl
Original file line number Diff line number Diff line change
Expand Up @@ -124,7 +124,7 @@ function tmp_create_partition_tables(connection)

DBInterface.execute(
connection,
"CREATE OR REPLACE TABLE flow_time_resolution(
"CREATE OR REPLACE TEMP TABLE t_flow_time_resolution(
from_asset STRING,
to_asset STRING,
year INT,
Expand All @@ -135,7 +135,7 @@ function tmp_create_partition_tables(connection)
)",
)

appender = DuckDB.Appender(connection, "flow_time_resolution")
appender = DuckDB.Appender(connection, "t_flow_time_resolution")
for row in TulipaIO.get_table(Val(:raw), connection, "explicit_flows_rep_periods_partitions")
durations = if row.specification == "uniform"
step = parse(Int, row.partition)
Expand All @@ -157,6 +157,17 @@ function tmp_create_partition_tables(connection)
_append_given_durations(appender, row, durations)
end
DuckDB.close(appender)

DBInterface.execute(
connection,
"CREATE OR REPLACE TABLE flow_time_resolution
AS
SELECT
*,
row_number() OVER (ORDER BY from_asset, to_asset, year, rep_period, time_block_start) AS variable_index
FROM t_flow_time_resolution
",
)
end

function tmp_create_constraints_indices(connection)
Expand Down Expand Up @@ -265,6 +276,9 @@ function tmp_create_constraints_indices(connection)
WHERE main.type in ('storage')
",
)

# WIP: For now, the incoming and outgoing expressions are being computed here
tmp_create_expressions(connection)
end

"""
Expand Down Expand Up @@ -303,3 +317,99 @@ function tmp_example_of_flow_expression_problem()

return connection, ep
end

function tmp_create_expressions(connection)
DuckDB.execute(
connection,
"CREATE OR REPLACE TABLE t_incoming_nonzero AS
SELECT
t_flows.from_asset,
t_flows.to_asset,
t_flows.year,
t_flows.rep_period,
t_flows.variable_index,
t_cons.time_block_start,
greatest(0, 1 +
least(t_flows.time_block_end,t_cons.time_block_end)
- greatest(t_flows.time_block_start,t_cons.time_block_start)) AS duration
FROM flow_time_resolution AS t_flows
INNER JOIN cons_indices_highest_in_out AS t_cons
ON t_flows.to_asset=t_cons.asset
AND t_flows.year=t_cons.year
AND t_flows.rep_period=t_cons.rep_period
WHERE duration > 0",
)

DuckDB.execute(
connection,
"CREATE OR REPLACE TABLE t_outgoing_nonzero AS
SELECT
t_flows.from_asset,
t_flows.to_asset,
t_flows.year,
t_flows.rep_period,
t_flows.variable_index,
t_cons.time_block_start,
greatest(0, 1 +
least(t_flows.time_block_end,t_cons.time_block_end)
- greatest(t_flows.time_block_start,t_cons.time_block_start)) AS duration
FROM flow_time_resolution AS t_flows
INNER JOIN cons_indices_highest_in_out AS t_cons
ON t_flows.from_asset=t_cons.asset
AND t_flows.year=t_cons.year
AND t_flows.rep_period=t_cons.rep_period
WHERE duration > 0",
)

DuckDB.execute(
connection,
"CREATE OR REPLACE TABLE highest_in_out_incoming AS
SELECT
t1.asset, t1.year, t1.rep_period, t1.time_block_start,
COALESCE(indices, []) AS indices,
COALESCE(durations, []) AS durations,
FROM cons_indices_highest_in_out AS t1
LEFT JOIN (
SELECT
to_asset as asset,
year,
rep_period,
time_block_start,
array_agg(variable_index) AS indices,
array_agg(duration) AS durations,
FROM t_incoming_nonzero
GROUP BY to_asset, year, rep_period, time_block_start
) AS t2
ON t1.asset=t2.asset
AND t1.year=t2.year
AND t1.rep_period=t2.rep_period
AND t1.time_block_start=t2.time_block_start
",
)

DuckDB.execute(
connection,
"CREATE OR REPLACE TABLE highest_in_out_outgoing AS
SELECT
t1.asset, t1.year, t1.rep_period, t1.time_block_start,
COALESCE(indices, []) AS indices,
COALESCE(durations, []) AS durations,
FROM cons_indices_highest_in_out AS t1
LEFT JOIN (
SELECT
from_asset as asset,
year,
rep_period,
time_block_start,
array_agg(variable_index) AS indices,
array_agg(duration) AS durations,
FROM t_outgoing_nonzero
GROUP BY from_asset, year, rep_period, time_block_start
) AS t2
ON t1.asset=t2.asset
AND t1.year=t2.year
AND t1.rep_period=t2.rep_period
AND t1.time_block_start=t2.time_block_start
",
)
end
1 change: 1 addition & 0 deletions test/test-pipeline.jl
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,7 @@ end

# Create model
model = create_model(
connection,
graph,
sets,
variables,
Expand Down

0 comments on commit 64be059

Please sign in to comment.