src/heuristics/hsp.jl

## HSP family of heuristics ##
export HSPHeuristic, HAdd, HMax
export HSPRHeuristic, HAddR, HMaxR

"""
    HSPHeuristic(op::Function)

A family of relaxed planning graph heuristics, introduced by the HSP 
planner [1]. The heuristic precomputes a graph that stores the dependencies
between all ground actions and plan-relevant conditions. The cost of achieving
each action (and also the goal) is then recursively estimated as the aggregated
cost of achieving each (pre)condition the action or goal depends upon, where
`op` is an aggregation function (e.g. `max` or `+`).
    
In turn, the cost of achieving each condition (a.k.a. "fact") is estimated
as the minimum cost among all actions that achieve that condition. Once a
condition is achieved by an action, it is considered to remain true through
the rest of the process, hence the relaxed nature of the heuristic.

This implementation supports domains with negative preconditions, disjunctive
preconditions (i.e., `or`, `exists`), and functional preconditions (e.g.
numeric comparisons, or other Boolean-valued functions of non-Boolean fluents).
Functional preconditions are handled by (optimistically) assuming they become
true once a constituent fluent is modified by some action.

[1] B. Bonet and H. Geffner, "Planning as Heuristic Search," Artificial
Intelligence, vol. 129, no. 1, pp. 5–33, Jun. 2001,
<https://doi.org/10.1016/S0004-3702(01)00108-4>.
"""
mutable struct HSPHeuristic{F <: Function} <: Heuristic
    # Function used to aggregate fact costs (e.g. `max` or `+`)
    op::F
    # Whether goal-relevant information is treated as dynamic
    dynamic_goal::Bool
    # Hash of the most recently precomputed goal, or `nothing` if there is none
    goal_hash::Union{Nothing,UInt}
    # Static fluents of the domain
    statics::Vector{Symbol}
    # Planning graph built during precomputation
    graph::PlanningGraph
    # Search state preallocated for the planning graph
    search_state::PlanningGraphSearchState

    # Both constructors pass only `op` to `new`; the remaining fields are
    # assigned later by `precompute!`.

    # Recover the aggregator from the function type `F` itself
    function HSPHeuristic{F}() where {F <: Function}
        return new{F}(F.instance)
    end

    # Take the type parameter from the supplied aggregator
    function HSPHeuristic(op::F) where {F <: Function}
        return new{F}(op)
    end
end

"""
    HMax()

[`HSPHeuristic`](@ref) where an action's cost is the `max` cost of the 
conditions it depends upon.
"""
const HMax = HSPHeuristic{typeof(max)} # `HMax()` recovers `max` via `F.instance`

"""
    HAdd()

[`HSPHeuristic`](@ref) where an action's cost is the sum of costs of the 
conditions it depends upon.
"""
const HAdd = HSPHeuristic{typeof(+)} # `HAdd()` recovers `+` via `F.instance`

# Print the heuristic as `<summary>(<op>, precomputed=<Bool>)`.
function Base.show(io::IO, h::HSPHeuristic)
    status = "precomputed=$(is_precomputed(h))"
    print(io, summary(h), "(", h.op, ", ", status, ")")
    return nothing
end

# The heuristic counts as precomputed once its `graph` field has been assigned.
function is_precomputed(h::HSPHeuristic)
    return isdefined(h, :graph)
end

# Precompute the planning graph when no goal specification is available.
# The goal is flagged as dynamic and no goal hash is stored. Returns `h`.
function precompute!(h::HSPHeuristic, domain::Domain, state::State)
    h.dynamic_goal, h.goal_hash = true, nothing
    # Static fluents are inferred first, since graph construction takes them
    h.statics = infer_static_fluents(domain)
    h.graph = build_planning_graph(domain, state; statics = h.statics)
    # Allocate the search state for the newly built graph
    h.search_state = PlanningGraphSearchState(h.graph)
    return h
end

# Precompute the planning graph for a known goal specification. The goal is
# flagged as non-dynamic and the hash of its goal terms is stored. Returns `h`.
function precompute!(
    h::HSPHeuristic, domain::Domain, state::State, spec::Specification
)
    h.dynamic_goal = false
    goal_terms = get_goal_terms(spec)
    h.goal_hash = hash(goal_terms)
    # Static fluents are inferred first, since graph construction takes them
    h.statics = infer_static_fluents(domain)
    h.graph = build_planning_graph(domain, state, spec; statics = h.statics)
    # Allocate the search state for the newly built graph
    h.search_state = PlanningGraphSearchState(h.graph)
    return h
end

# Estimate the relaxed cost of reaching the goal in `spec` from `state`.
#
# When the heuristic was precomputed without a goal (`h.dynamic_goal`), the
# planning graph is updated whenever the hash of the goal terms differs from
# the stored one. The search state is then re-initialized for `state`, and the
# goal cost found by the planning graph search is returned.
function compute(h::HSPHeuristic,
                 domain::Domain, state::State, spec::Specification)
    # If necessary, update planning graph with new goal
    if h.dynamic_goal
        # Hash the goal terms once and reuse the result for both the
        # comparison and the stored value
        goal_hash = hash(get_goal_terms(spec))
        if goal_hash != h.goal_hash
            # NOTE(review): `h.search_state` is not reallocated here;
            # presumably `init_pgraph_search!` adapts it to the updated
            # graph — confirm
            h.graph = update_pgraph_goal!(h.graph, domain, state, spec;
                                          statics=h.statics)
            h.goal_hash = goal_hash
        end
    end
    # Compute relaxed costs to goal nodes of the planning graph
    init_pgraph_search!(h.search_state, h.graph, domain, state)
    _, _, goal_cost = run_pgraph_search!(h.search_state, h.graph, spec, h.op)
    # Return goal cost (may be infinite if unreachable)
    return goal_cost
end

"""
    HSPRHeuristic(op::Function)

A family of relaxed planning graph heuristics for backward search, introduced
by the HSPr planner ("r" stands for regression) [1]. The costs of achieving 
a condition are estimated in the same way as the forward variant, 
[`HSPHeuristic`](@ref), but this estimation is performed only once during 
heuristic precomputation. During heuristic evaluation, the cost from the current
partial state to the start state is estimated as the aggregated cost of each
condition that is true in the partial state.

[1] B. Bonet and H. Geffner, "Planning as Heuristic Search," Artificial
Intelligence, vol. 129, no. 1, pp. 5–33, Jun. 2001,
<https://doi.org/10.1016/S0004-3702(01)00108-4>.
"""
mutable struct HSPRHeuristic{F <: Function} <: Heuristic
    # Function used to aggregate fact costs (e.g. `max` or `+`)
    op::F
    # Estimated cost of reaching each fact from the goal
    costs::Dict{Term,Float64}

    # Both constructors pass only `op` to `new`; `costs` is assigned later
    # by `precompute!`.

    # Recover the aggregator from the function type `F` itself
    function HSPRHeuristic{F}() where {F <: Function}
        return new{F}(F.instance)
    end

    # Take the type parameter from the supplied aggregator
    function HSPRHeuristic(op::F) where {F <: Function}
        return new{F}(op)
    end
end

"""
    HMaxR()

[`HSPRHeuristic`](@ref) for backward search, where an action's cost is the
`max` cost of its dependencies.
"""
const HMaxR = HSPRHeuristic{typeof(max)} # `HMaxR()` recovers `max` via `F.instance`

"""
    HAddR()

[`HSPRHeuristic`](@ref) for backward search, where an action's cost is the
sum of costs of its dependencies.
"""
const HAddR = HSPRHeuristic{typeof(+)} # `HAddR()` recovers `+` via `F.instance`

# Print the heuristic as `<summary>(<op>, precomputed=<Bool>)`.
function Base.show(io::IO, h::HSPRHeuristic)
    status = "precomputed=$(is_precomputed(h))"
    print(io, summary(h), "(", h.op, ", ", status, ")")
    return nothing
end

# The heuristic counts as precomputed once its `costs` field has been assigned.
function is_precomputed(h::HSPRHeuristic)
    return isdefined(h, :costs)
end

# Run the planning graph search once and store the resulting cost of every
# condition in `h.costs`, keyed by the condition term. Returns `h`.
function precompute!(
    h::HSPRHeuristic, domain::Domain, state::State, spec::Specification
)
    # Build the planning graph and compute fact costs over it
    pgraph = build_planning_graph(domain, state)
    searched, _, _ = run_pgraph_search(pgraph, domain, state, spec, h.op)
    # Pair each condition with its cost, then store as a dictionary for
    # fast look-up during evaluation
    fact_costs = zip(pgraph.conditions, searched.cond_costs)
    h.costs = Dict{Term,Float64}(fact_costs)
    return h
end

# Estimate the cost of the (partial) `state` by aggregating, with `h.op`, the
# precomputed costs of all facts that hold in it.
#
# Returns `0.0` when the state has no facts. Facts with no entry in `h.costs`
# contribute a cost of zero.
function compute(h::HSPRHeuristic,
                 domain::Domain, state::State, spec::Specification)
    # Compute cost of achieving all facts in current state
    facts = PDDL.get_facts(state)
    # TODO: Handle negative literals
    isempty(facts) && return 0.0
    # The fallback is a `Float64` (not the integer `0`) so that every element
    # of the reduction, and hence the result, has the same type as the stored
    # costs, even when no fact in the state has a stored cost
    return reduce(h.op, (get(h.costs, f, 0.0) for f in facts))
end