Merge pull request #104 from Herb-AI/refactor-probe

Refactor probe code
Herb-AI · May 19, 2024 · 0d941be · 0d941be
2 parents 0b80af7 + 0cb2514
commit 0d941be
Show file tree

Hide file tree

Showing 8 changed files with 253 additions and 237 deletions.
diff --git a/src/probe/guided_search_iterator.jl b/src/probe/guided_search_iterator.jl
@@ -4,7 +4,7 @@
     symboltable::SymbolTable
 
 )
-@kwdef mutable struct GuidedSearchState
+Base.@kwdef mutable struct GuidedSearchState
     level::Int64
     bank::Vector{Vector{RuleNode}}
     eval_cache::Set
@@ -17,19 +17,20 @@ function Base.iterate(iter::GuidedSearchIterator)
         level=-1,
         bank=[],
         eval_cache=Set(),
-        iter=NewProgramsIterator(0, [], iter.grammar),
+        iter=NewProgramsIterator(0, [], get_grammar(iter.solver)),
         next_iter=nothing
     ))
 end
 
 function Base.iterate(iter::GuidedSearchIterator, state::GuidedSearchState)::Union{Tuple{RuleNode, GuidedSearchState}, Nothing}
+    grammar = get_grammar(iter.solver)
     # wrap in while true to optimize for tail call
     while true
         while state.next_iter === nothing
             state.level += 1
             push!(state.bank, [])
 
-            state.iter = NewProgramsIterator(state.level, state.bank, iter.grammar)
+            state.iter = NewProgramsIterator(state.level, state.bank, grammar) 
             state.next_iter = iterate(state.iter)
             if state.level > 0
                 @info ("Finished level $(state.level - 1) with $(length(state.bank[state.level])) programs")
@@ -45,7 +46,7 @@ function Base.iterate(iter::GuidedSearchIterator, state::GuidedSearchState)::Uni
 
             # evaluate program
             eval_observation = []
-            expr = rulenode2expr(prog, iter.grammar)
+            expr = rulenode2expr(prog, grammar)
             for example ∈ iter.spec
                 output = execute_on_input(iter.symboltable, expr, example.in)
                 push!(eval_observation, output)

diff --git a/src/probe/new_program_iterator.jl b/src/probe/new_program_iterator.jl
@@ -67,3 +67,24 @@ function Base.iterate(iter::NewProgramsIterator, state::NewProgramsState)
     end
     return nothing
 end
+
+"""
+    calculate_rule_cost_prob(rule_index, grammar, log_base = 2)
+
+Return the cost of rule `rule_index` as an `Int64`: the entry
+`grammar.log_probabilities[rule_index]` is divided by `log(log_base)`, negated
+and rounded to the nearest integer.
+
+NOTE(review): dividing by `log(log_base)` is a change of base from the natural
+logarithm, so this presumes the stored values are natural logs — confirm against
+the code that fills `grammar.log_probabilities`.
+"""
+function calculate_rule_cost_prob(rule_index, grammar, log_base = 2)
+    scaled = grammar.log_probabilities[rule_index] / log(log_base)
+    return round(Int64, -scaled)
+end
+
+"""
+    calculate_rule_cost_size(rule_index, grammar)
+
+Return a cost of `1` for every rule; both arguments are ignored.
+"""
+calculate_rule_cost_size(rule_index, grammar) = 1
+
+"""
+    calculate_rule_cost(rule_index::Int, grammar::ContextSensitiveGrammar)
+
+Return the cost of rule `rule_index`, delegating to `calculate_rule_cost_size`.
+"""
+function calculate_rule_cost(rule_index::Int, grammar::ContextSensitiveGrammar)
+    return calculate_rule_cost_size(rule_index, grammar)
+end
+
+"""
+    calculate_program_cost(program::RuleNode, grammar::ContextSensitiveGrammar)
+
+Return the total cost of `program`: the cost of its root rule (`program.ind`)
+plus the recursively computed cost of every subtree in `program.children`.
+"""
+function calculate_program_cost(program::RuleNode, grammar::ContextSensitiveGrammar)
+    subtree_costs = (calculate_program_cost(child, grammar) for child ∈ program.children)
+    # `init=0` keeps the sum defined for nodes without children
+    return sum(subtree_costs; init=0) + calculate_rule_cost(program.ind, grammar)
+end
diff --git a/src/probe/probe_iterator.jl b/src/probe/probe_iterator.jl
@@ -1,6 +1,3 @@
-include("sum_iterator.jl")
-include("new_program_iterator.jl")
-include("guided_search_iterator.jl")
 """
     struct ProgramCache 
 
@@ -17,15 +14,28 @@ function Base.:(==)(a::ProgramCache, b::ProgramCache)
 end
 Base.hash(a::ProgramCache) = hash(a.program)
 
-select(partial_sols::Vector{ProgramCache}, all_selected_psols::Set{ProgramCache}) = HerbSearch.selectpsol_largest_subset(partial_sols, all_selected_psols)
-update!(grammar::ContextSensitiveGrammar, PSols_with_eval_cache::Vector{ProgramCache}, examples::Vector{<:IOExample}) = update_grammar(grammar, PSols_with_eval_cache, examples)
+include("sum_iterator.jl")
+include("new_program_iterator.jl")
+include("guided_search_iterator.jl")
+
+include("select_partial_sols.jl")
+include("update_grammar.jl")
+
+"""
+    select_partial_solution(partial_sols::Vector{ProgramCache}, all_selected_psols::Set{ProgramCache})
+
+Choose the partial solutions to use by forwarding both arguments to
+`HerbSearch.selectpsol_largest_subset`.
+"""
+function select_partial_solution(partial_sols::Vector{ProgramCache}, all_selected_psols::Set{ProgramCache})
+    return HerbSearch.selectpsol_largest_subset(partial_sols, all_selected_psols)
+end
+"""
+    update_grammar!(grammar::ContextSensitiveGrammar, PSols_with_eval_cache::Vector{ProgramCache}, examples::Vector{<:IOExample})
+
+Update `grammar` from the given partial solutions by forwarding all arguments to
+`update_grammar`.
+"""
+function update_grammar!(grammar::ContextSensitiveGrammar, PSols_with_eval_cache::Vector{ProgramCache}, examples::Vector{<:IOExample})
+    return update_grammar(grammar, PSols_with_eval_cache, examples)
+end
 
+"""
+    probe(examples::Vector{<:IOExample}, iterator::ProgramIterator, max_time::Int, iteration_size::Int)
+
+Probe for a solution using the given `iterator` and `examples` with a time limit of `max_time` and `iteration_size`.
+"""
 function probe(examples::Vector{<:IOExample}, iterator::ProgramIterator, max_time::Int, iteration_size::Int)
     start_time = time()
     # store a set of all the results of evaluation programs
     eval_cache = Set()
     state = nothing
-    symboltable = SymbolTable(iterator.grammar)
+    grammar = get_grammar(iterator.solver)
+    symboltable = SymbolTable(grammar)
     # all partial solutions that were found so far
     all_selected_psols = Set{ProgramCache}()
     # start next iteration while there is time left
@@ -40,7 +50,7 @@ function probe(examples::Vector{<:IOExample}, iterator::ProgramIterator, max_tim
             # evaluate program
             eval_observation = []
             correct_examples = Vector{Int}()
-            expr = rulenode2expr(program, iterator.grammar)
+            expr = rulenode2expr(program, grammar)
             for (example_index, example) ∈ enumerate(examples)
                 output = execute_on_input(symboltable, expr, example.in)
                 push!(eval_observation, output)
@@ -52,13 +62,13 @@ function probe(examples::Vector{<:IOExample}, iterator::ProgramIterator, max_tim
 
             nr_correct_examples = length(correct_examples)
             if nr_correct_examples == length(examples) # found solution
-                println("Last level: $(length(state.bank[state.level + 1])) programs")
+                @info "Last level: $(length(state.bank[state.level + 1])) programs"
                 return program
             elseif eval_observation in eval_cache # result already in cache
                 next = iterate(iterator, state)
                 continue
             elseif nr_correct_examples >= 1 # partial solution 
-                program_cost = calculate_program_cost(program, iterator.grammar)
+                program_cost = calculate_program_cost(program, grammar)
                 push!(psol_with_eval_cache, ProgramCache(program, correct_examples, program_cost))
             end
 
@@ -72,174 +82,23 @@ function probe(examples::Vector{<:IOExample}, iterator::ProgramIterator, max_tim
         if next === nothing
             return nothing
         end
-        partial_sols = filter(x -> x ∉ all_selected_psols, select(psol_with_eval_cache, all_selected_psols))
+        partial_sols = filter(x -> x ∉ all_selected_psols, select_partial_solution(psol_with_eval_cache, all_selected_psols))
         if !isempty(partial_sols)
-            print(rulenode2expr(partial_sols[1].program, iterator.grammar))
             push!(all_selected_psols, partial_sols...)
             # update probabilities if any promising partial solutions
-            update!(iterator.grammar, partial_sols, examples) # update probabilites
+            update_grammar!(grammar, partial_sols, examples) # update probabilites
             # restart iterator
             eval_cache = Set()
             state = nothing
 
             #for loop to update all_selected_psols with new costs
             for prog_with_cache ∈ all_selected_psols
                 program = prog_with_cache.program
-                new_cost = calculate_program_cost(program, iterator.grammar)
+                new_cost = calculate_program_cost(program, grammar)
                 prog_with_cache.cost = new_cost
             end
         end
     end
 
     return nothing
 end
-
-function update_grammar(grammar::ContextSensitiveGrammar, PSols_with_eval_cache::Vector{ProgramCache}, examples::Vector{<:IOExample})
-    sum = 0
-    for rule_index in eachindex(grammar.rules) # iterate for each rule_index 
-        highest_correct_nr = 0
-        for psol in PSols_with_eval_cache
-            program = psol.program
-            len_correct_examples = length(psol.correct_examples)
-            # check if the program tree has rule_index somewhere inside it using a recursive function
-            if contains_rule(program, rule_index) && len_correct_examples > highest_correct_nr
-                highest_correct_nr = len_correct_examples
-            end
-        end
-        fitnes = highest_correct_nr / length(examples)
-        p_uniform = 1 / length(grammar.rules)
-
-        # compute (log2(p_u) ^ (1 - fit)) = (1-fit) * log2(p_u)
-        sum += p_uniform^(1 - fitnes)
-        log_prob = ((1 - fitnes) * log(2, p_uniform))
-        grammar.log_probabilities[rule_index] = log_prob
-    end
-    total_sum = 0
-    for rule_index in eachindex(grammar.rules)
-        grammar.log_probabilities[rule_index] = grammar.log_probabilities[rule_index] - log(2, sum)
-        total_sum += 2^(grammar.log_probabilities[rule_index])
-    end
-    @assert abs(total_sum - 1) <= 1e-4 "Total sum is $(total_sum) "
-end
-
-"""
-    contains_rule(program::RuleNode, rule_index::Int)
-
-Check if a given `RuleNode` contains has used a derivation rule with the specified `rule_index`
-
-# Arguments
-- `program::RuleNode`: The `RuleNode` to check.
-- `rule_index::Int`: The index of the rule to check for.
-
-"""
-function contains_rule(program::RuleNode, rule_index::Int)
-    if program.ind == rule_index # if the rule is good return true
-        return true
-    else
-        for child in program.children
-            if contains_rule(child, rule_index)  # if a child has that rule then return true
-                return true
-            end
-        end
-        return false # if no child has that rule return false
-    end
-end
-
-
-
-"""
-    selectpsol_largest_subset(partial_sols::Vector{ProgramCache}}, all_selected_psols::Set{ProgramCache})) 
-
-This scheme selects a single cheapest program (first enumerated) that 
-satisfies the largest subset of examples encountered so far across all partial_sols.
-"""
-function selectpsol_largest_subset(partial_sols::Vector{ProgramCache}, all_selected_psols::Set{ProgramCache})
-    if isempty(partial_sols)
-        return Vector{ProgramCache}()
-    end
-    push!(partial_sols, all_selected_psols...)
-    largest_subset_length = 0
-    cost = typemax(Int)
-    best_sol = partial_sols[begin]
-    for psol in partial_sols
-        len = length(psol.correct_examples)
-        if len > largest_subset_length || len == largest_subset_length && psol.cost < cost
-            largest_subset_length = len
-            best_sol = psol
-            cost = psol.cost
-        end
-    end
-    return [best_sol]
-end
-
-"""
-    selectpsol_first_cheapest(partial_sols::Vector{ProgramCache}}, all_selected_psols::Set{ProgramCache})) 
-
-This scheme selects a single cheapest program (first enumerated) that 
-satisfies a unique subset of examples.
-"""
-function selectpsol_first_cheapest(partial_sols::Vector{ProgramCache}, all_selected_psol::Set{ProgramCache})
-    # maps subset of examples to the cheapest program 
-    mapping = Dict{Vector{Int},ProgramCache}()
-    for sol ∈ partial_sols
-        examples = sol.correct_examples
-        if !haskey(mapping, examples)
-            mapping[examples] = sol
-        else
-            # if the cost of the new program is less than the cost of the previous program with the same subset of examples replace it
-            if sol.cost < mapping[examples].cost
-                mapping[examples] = sol
-            end
-        end
-    end
-    # get the cheapest programs that satisfy unique subsets of examples
-    return collect(values(mapping))
-end
-
-"""
-    selectpsol_all_cheapest(partial_sols::Vector{ProgramCache}, all_selected_psol::Set{ProgramCache}) 
-
-This scheme selects all cheapest programs that satisfies a unique subset of examples.
-"""
-function selectpsol_all_cheapest(partial_sols::Vector{ProgramCache}, all_selected_psol::Set{ProgramCache})
-    # maps subset of examples to the cheapest program 
-    mapping = Dict{Vector{Int},Vector{ProgramCache}}()
-    for sol ∈ partial_sols
-        examples = sol.correct_examples
-        if !haskey(mapping, examples)
-            mapping[examples] = [sol]
-        else
-            # if the cost of the new program is less than the cost of the first program
-            progs = mapping[examples]
-            if sol.cost < progs[begin].cost
-                mapping[examples] = [sol]
-            elseif sol.cost == progs[begin].cost
-                # append to the list of cheapest programs
-                push!(progs, sol)
-            end
-        end
-    end
-    # get all cheapest programs that satisfy unique subsets of examples
-    return collect(Iterators.flatten(values(mapping)))
-end
-
-function calculate_rule_cost_prob(rule_index, grammar)
-    log_prob = grammar.log_probabilities[rule_index]
-    return convert(Int64, round(-log_prob))
-end
-
-function calculate_rule_cost_size(rule_index, grammar)
-    return 1
-end
-
-calculate_rule_cost(rule_index::Int, grammar::ContextSensitiveGrammar) = calculate_rule_cost_size(rule_index, grammar)
-
-"""
-    calculate_program_cost(program::RuleNode, grammar::ContextSensitiveGrammar)  
-Calculates the cost of a program by summing up the cost of the children and the cost of the rule
-"""
-function calculate_program_cost(program::RuleNode, grammar::ContextSensitiveGrammar)
-    cost_children = sum([calculate_program_cost(child, grammar) for child ∈ program.children], init=0)
-    cost_rule = calculate_rule_cost(program.ind, grammar)
-    return cost_children + cost_rule
-end
diff --git a/src/probe/select_partial_sols.jl b/src/probe/select_partial_sols.jl
@@ -0,0 +1,75 @@
+"""
+    selectpsol_largest_subset(partial_sols::Vector{ProgramCache}, all_selected_psols::Set{ProgramCache})
+
+This scheme selects a single program among `partial_sols` and `all_selected_psols`:
+the one that satisfies the largest subset of examples, with ties broken by lower
+cost (the first one encountered wins when the cost is equal as well).
+
+Returns a one-element vector, or an empty vector when `partial_sols` is empty.
+Neither argument is modified.
+"""
+function selectpsol_largest_subset(partial_sols::Vector{ProgramCache}, all_selected_psols::Set{ProgramCache})
+    if isempty(partial_sols)
+        return Vector{ProgramCache}()
+    end
+    largest_subset_length = 0
+    cost = typemax(Int)
+    best_sol = partial_sols[begin]
+    # Walk both collections lazily rather than pushing the already-selected
+    # solutions into `partial_sols`, which would mutate the caller's vector.
+    for psol in Iterators.flatten((partial_sols, all_selected_psols))
+        len = length(psol.correct_examples)
+        if len > largest_subset_length || (len == largest_subset_length && psol.cost < cost)
+            largest_subset_length = len
+            best_sol = psol
+            cost = psol.cost
+        end
+    end
+    return [best_sol]
+end
+
+"""
+    selectpsol_first_cheapest(partial_sols::Vector{ProgramCache}, all_selected_psol::Set{ProgramCache})
+
+For every distinct `correct_examples` vector found in `partial_sols`, keep the
+cheapest program; when costs are equal the first enumerated program is kept.
+`all_selected_psol` is not used by this scheme.
+"""
+function selectpsol_first_cheapest(partial_sols::Vector{ProgramCache}, all_selected_psol::Set{ProgramCache})
+    # cheapest program seen so far for each subset of satisfied examples
+    cheapest_by_examples = Dict{Vector{Int},ProgramCache}()
+    for candidate ∈ partial_sols
+        key = candidate.correct_examples
+        incumbent = get(cheapest_by_examples, key, nothing)
+        # strict `<` keeps the earlier program when the costs tie
+        if incumbent === nothing || candidate.cost < incumbent.cost
+            cheapest_by_examples[key] = candidate
+        end
+    end
+    return collect(values(cheapest_by_examples))
+end
+
+"""
+    selectpsol_all_cheapest(partial_sols::Vector{ProgramCache}, all_selected_psol::Set{ProgramCache})
+
+For every distinct `correct_examples` vector found in `partial_sols`, keep all
+programs that share the lowest cost for that vector, and return them as one flat
+vector. `all_selected_psol` is not used by this scheme.
+"""
+function selectpsol_all_cheapest(partial_sols::Vector{ProgramCache}, all_selected_psol::Set{ProgramCache})
+    # all cheapest programs seen so far for each subset of satisfied examples
+    cheapest_by_examples = Dict{Vector{Int},Vector{ProgramCache}}()
+    for candidate ∈ partial_sols
+        key = candidate.correct_examples
+        group = get(cheapest_by_examples, key, nothing)
+        if group === nothing || candidate.cost < group[begin].cost
+            # first program for this subset, or strictly cheaper: start a new group
+            cheapest_by_examples[key] = [candidate]
+        elseif candidate.cost == group[begin].cost
+            # same cost as the current cheapest: keep it alongside the others
+            push!(group, candidate)
+        end
+    end
+    return collect(Iterators.flatten(values(cheapest_by_examples)))
+end
diff --git a/src/probe/sum_iterator.jl b/src/probe/sum_iterator.jl
@@ -17,7 +17,7 @@ for option ∈ sum_iter
 end
 ```
 """
-@kwdef struct SumIterator
+Base.@kwdef struct SumIterator
     number_of_elements::Int
     desired_sum::Int
     max_value::Int