2024-06-27 03:01:39 -04:00
|
|
|
/*
|
|
|
|
* <Short Description>
|
|
|
|
* Copyright (C) 2024 Brett Terpstra
|
|
|
|
*
|
|
|
|
* This program is free software: you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
|
|
* (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* along with this program. If not, see <https://www.gnu.org/licenses/>.
|
|
|
|
*/
|
|
|
|
#include <blt/gp/transformers.h>
|
2024-06-30 21:44:45 -04:00
|
|
|
#include <blt/gp/program.h>
|
2024-07-02 13:57:46 -04:00
|
|
|
#include <blt/std/ranges.h>
|
2024-08-03 13:16:53 -04:00
|
|
|
#include <blt/std/utility.h>
|
2024-08-06 02:46:01 -04:00
|
|
|
#include <algorithm>
|
|
|
|
#include <blt/std/memory.h>
|
2024-08-05 02:40:16 -04:00
|
|
|
#include <blt/profiling/profiler_v2.h>
|
2024-06-30 21:44:45 -04:00
|
|
|
#include <random>
|
2024-06-27 03:01:39 -04:00
|
|
|
|
|
|
|
namespace blt::gp
|
|
|
|
{
|
2024-08-06 02:46:01 -04:00
|
|
|
|
|
|
|
inline blt::size_t accumulate_type_sizes(detail::op_iter begin, detail::op_iter end)
|
|
|
|
{
|
|
|
|
blt::size_t total = 0;
|
|
|
|
for (auto it = begin; it != end; ++it)
|
|
|
|
{
|
|
|
|
if (it->is_value)
|
|
|
|
total += stack_allocator::aligned_size(it->type_size);
|
|
|
|
}
|
|
|
|
return total;
|
|
|
|
}
|
|
|
|
|
|
|
|
template<typename>
|
|
|
|
blt::u8* get_thread_pointer_for_size(blt::size_t bytes)
|
|
|
|
{
|
|
|
|
static thread_local blt::expanding_buffer<blt::u8> buffer;
|
|
|
|
if (bytes > buffer.size())
|
|
|
|
buffer.resize(bytes);
|
|
|
|
return buffer.data();
|
|
|
|
}
|
|
|
|
|
2024-07-09 03:57:58 -04:00
|
|
|
grow_generator_t grow_generator;
|
|
|
|
|
2024-08-06 02:46:01 -04:00
|
|
|
mutation_t::config_t::config_t(): generator(grow_generator)
|
|
|
|
{}
|
|
|
|
|
2024-06-30 03:20:56 -04:00
|
|
|
blt::expected<crossover_t::result_t, crossover_t::error_t> crossover_t::apply(gp_program& program, const tree_t& p1, const tree_t& p2) // NOLINT
|
|
|
|
{
|
|
|
|
result_t result{p1, p2};
|
2024-07-03 14:04:48 -04:00
|
|
|
|
2024-06-30 21:44:45 -04:00
|
|
|
auto& c1 = result.child1;
|
|
|
|
auto& c2 = result.child2;
|
2024-06-30 03:20:56 -04:00
|
|
|
|
2024-06-30 21:44:45 -04:00
|
|
|
auto& c1_ops = c1.get_operations();
|
|
|
|
auto& c2_ops = c2.get_operations();
|
|
|
|
|
2024-07-02 13:57:46 -04:00
|
|
|
if (c1_ops.size() < 5 || c2_ops.size() < 5)
|
|
|
|
return blt::unexpected(error_t::TREE_TOO_SMALL);
|
|
|
|
|
2024-07-20 13:02:41 -04:00
|
|
|
auto point = get_crossover_point(program, c1, c2);
|
|
|
|
|
|
|
|
if (!point)
|
|
|
|
return blt::unexpected(point.error());
|
|
|
|
|
|
|
|
auto crossover_point_begin_itr = c1_ops.begin() + point->p1_crossover_point;
|
|
|
|
auto crossover_point_end_itr = c1_ops.begin() + find_endpoint(program, c1_ops, point->p1_crossover_point);
|
2024-08-02 21:08:34 -04:00
|
|
|
|
2024-07-20 13:02:41 -04:00
|
|
|
auto found_point_begin_itr = c2_ops.begin() + point->p2_crossover_point;
|
|
|
|
auto found_point_end_itr = c2_ops.begin() + find_endpoint(program, c2_ops, point->p2_crossover_point);
|
|
|
|
|
2024-08-06 02:46:01 -04:00
|
|
|
stack_allocator& c1_stack = c1.get_values();
|
|
|
|
stack_allocator& c2_stack = c2.get_values();
|
2024-07-20 13:02:41 -04:00
|
|
|
|
2024-07-20 15:45:07 -04:00
|
|
|
// we have to make a copy because we will modify the underlying storage.
|
2024-07-20 13:02:41 -04:00
|
|
|
std::vector<op_container_t> c1_operators;
|
|
|
|
std::vector<op_container_t> c2_operators;
|
|
|
|
|
2024-07-20 15:45:07 -04:00
|
|
|
for (const auto& op : blt::iterate(crossover_point_begin_itr, crossover_point_end_itr))
|
2024-07-20 13:02:41 -04:00
|
|
|
c1_operators.push_back(op);
|
2024-07-20 15:45:07 -04:00
|
|
|
for (const auto& op : blt::iterate(found_point_begin_itr, found_point_end_itr))
|
2024-07-20 13:02:41 -04:00
|
|
|
c2_operators.push_back(op);
|
|
|
|
|
2024-08-06 02:46:01 -04:00
|
|
|
blt::size_t c1_stack_after_bytes = accumulate_type_sizes(crossover_point_end_itr, c1_ops.end());
|
|
|
|
blt::size_t c1_stack_for_bytes = accumulate_type_sizes(crossover_point_begin_itr, crossover_point_end_itr);
|
|
|
|
blt::size_t c2_stack_after_bytes = accumulate_type_sizes(found_point_end_itr, c2_ops.end());
|
|
|
|
blt::size_t c2_stack_for_bytes = accumulate_type_sizes(found_point_begin_itr, found_point_end_itr);
|
|
|
|
auto c1_total = static_cast<blt::ptrdiff_t>(c1_stack_after_bytes + c1_stack_for_bytes);
|
|
|
|
auto c2_total = static_cast<blt::ptrdiff_t>(c2_stack_after_bytes + c2_stack_for_bytes);
|
|
|
|
auto copy_ptr_c1 = get_thread_pointer_for_size<struct c1>(c1_total);
|
|
|
|
auto copy_ptr_c2 = get_thread_pointer_for_size<struct c2>(c2_total);
|
|
|
|
|
|
|
|
c1_stack.copy_to(copy_ptr_c1, c1_total);
|
|
|
|
c1_stack.pop_bytes(c1_total);
|
2024-07-20 13:02:41 -04:00
|
|
|
|
2024-08-06 02:46:01 -04:00
|
|
|
c2_stack.copy_to(copy_ptr_c2, c2_total);
|
|
|
|
c2_stack.pop_bytes(c2_total);
|
|
|
|
|
|
|
|
c2_stack.copy_from(copy_ptr_c1, c1_stack_for_bytes);
|
|
|
|
c2_stack.copy_from(copy_ptr_c2 + c2_stack_for_bytes, c2_stack_after_bytes);
|
|
|
|
|
|
|
|
c1_stack.copy_from(copy_ptr_c2, c2_stack_for_bytes);
|
|
|
|
c1_stack.copy_from(copy_ptr_c1 + c1_stack_for_bytes, c1_stack_after_bytes);
|
|
|
|
|
2024-07-20 13:02:41 -04:00
|
|
|
// now swap the operators
|
|
|
|
auto insert_point_c1 = crossover_point_begin_itr - 1;
|
|
|
|
auto insert_point_c2 = found_point_begin_itr - 1;
|
|
|
|
|
|
|
|
// invalidates [begin, end()) so the insert points should be fine
|
|
|
|
c1_ops.erase(crossover_point_begin_itr, crossover_point_end_itr);
|
|
|
|
c2_ops.erase(found_point_begin_itr, found_point_end_itr);
|
|
|
|
|
|
|
|
c1_ops.insert(++insert_point_c1, c2_operators.begin(), c2_operators.end());
|
|
|
|
c2_ops.insert(++insert_point_c2, c1_operators.begin(), c1_operators.end());
|
2024-08-02 21:08:34 -04:00
|
|
|
|
|
|
|
#if BLT_DEBUG_LEVEL >= 2
|
|
|
|
blt::size_t c1_found_bytes = result.child1.get_values().size().total_used_bytes;
|
|
|
|
blt::size_t c2_found_bytes = result.child2.get_values().size().total_used_bytes;
|
|
|
|
blt::size_t c1_expected_bytes = std::accumulate(result.child1.get_operations().begin(), result.child1.get_operations().end(), 0ul,
|
|
|
|
[](const auto& v1, const auto& v2) {
|
|
|
|
if (v2.is_value)
|
|
|
|
return v1 + stack_allocator::aligned_size(v2.type_size);
|
|
|
|
return v1;
|
|
|
|
});
|
|
|
|
blt::size_t c2_expected_bytes = std::accumulate(result.child2.get_operations().begin(), result.child2.get_operations().end(), 0ul,
|
|
|
|
[](const auto& v1, const auto& v2) {
|
|
|
|
if (v2.is_value)
|
|
|
|
return v1 + stack_allocator::aligned_size(v2.type_size);
|
|
|
|
return v1;
|
|
|
|
});
|
|
|
|
if (c1_found_bytes != c1_expected_bytes || c2_found_bytes != c2_expected_bytes)
|
|
|
|
{
|
|
|
|
BLT_WARN("C1 Found bytes %ld vs Expected Bytes %ld", c1_found_bytes, c1_expected_bytes);
|
|
|
|
BLT_WARN("C2 Found bytes %ld vs Expected Bytes %ld", c2_found_bytes, c2_expected_bytes);
|
|
|
|
BLT_ABORT("Amount of bytes in stack doesn't match the number of bytes expected for the operations");
|
|
|
|
}
|
|
|
|
#endif
|
2024-07-20 13:02:41 -04:00
|
|
|
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
|
|
|
blt::expected<crossover_t::crossover_point_t, crossover_t::error_t> crossover_t::get_crossover_point(gp_program& program, const tree_t& c1,
|
|
|
|
const tree_t& c2) const
|
|
|
|
{
|
|
|
|
auto& c1_ops = c1.get_operations();
|
|
|
|
auto& c2_ops = c2.get_operations();
|
|
|
|
|
2024-07-09 21:57:18 -04:00
|
|
|
blt::size_t crossover_point = program.get_random().get_size_t(1ul, c1_ops.size());
|
2024-07-03 21:27:57 -04:00
|
|
|
|
|
|
|
while (config.avoid_terminals && program.get_operator_info(c1_ops[crossover_point].id).argc.is_terminal())
|
2024-07-09 21:57:18 -04:00
|
|
|
crossover_point = program.get_random().get_size_t(1ul, c1_ops.size());
|
2024-07-03 21:27:57 -04:00
|
|
|
|
2024-06-30 21:44:45 -04:00
|
|
|
blt::size_t attempted_point = 0;
|
|
|
|
|
|
|
|
const auto& crossover_point_type = program.get_operator_info(c1_ops[crossover_point].id);
|
|
|
|
operator_info* attempted_point_type = nullptr;
|
|
|
|
|
|
|
|
blt::size_t counter = 0;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
if (counter >= config.max_crossover_tries)
|
|
|
|
{
|
|
|
|
if (config.should_crossover_try_forward)
|
|
|
|
{
|
2024-07-03 21:27:57 -04:00
|
|
|
bool found = false;
|
2024-06-30 21:44:45 -04:00
|
|
|
for (auto i = attempted_point + 1; i < c2_ops.size(); i++)
|
|
|
|
{
|
|
|
|
auto* info = &program.get_operator_info(c2_ops[i].id);
|
|
|
|
if (info->return_type == crossover_point_type.return_type)
|
|
|
|
{
|
2024-07-03 21:27:57 -04:00
|
|
|
if (config.avoid_terminals && info->argc.is_terminal())
|
|
|
|
continue;
|
2024-06-30 21:44:45 -04:00
|
|
|
attempted_point = i;
|
|
|
|
attempted_point_type = info;
|
2024-07-03 21:27:57 -04:00
|
|
|
found = true;
|
2024-06-30 21:44:45 -04:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2024-07-03 21:27:57 -04:00
|
|
|
if (!found)
|
|
|
|
return blt::unexpected(error_t::NO_VALID_TYPE);
|
2024-06-30 21:44:45 -04:00
|
|
|
}
|
|
|
|
// should we try again over the whole tree? probably not.
|
|
|
|
return blt::unexpected(error_t::NO_VALID_TYPE);
|
|
|
|
} else
|
|
|
|
{
|
2024-07-09 21:57:18 -04:00
|
|
|
attempted_point = program.get_random().get_size_t(1ul, c2_ops.size());
|
2024-06-30 21:44:45 -04:00
|
|
|
attempted_point_type = &program.get_operator_info(c2_ops[attempted_point].id);
|
2024-07-03 21:27:57 -04:00
|
|
|
if (config.avoid_terminals && attempted_point_type->argc.is_terminal())
|
|
|
|
continue;
|
|
|
|
if (crossover_point_type.return_type == attempted_point_type->return_type)
|
|
|
|
break;
|
2024-06-30 21:44:45 -04:00
|
|
|
counter++;
|
|
|
|
}
|
2024-07-03 21:27:57 -04:00
|
|
|
} while (true);
|
2024-06-30 21:44:45 -04:00
|
|
|
|
2024-07-20 13:02:41 -04:00
|
|
|
return crossover_point_t{static_cast<blt::ptrdiff_t>(crossover_point), static_cast<blt::ptrdiff_t>(attempted_point)};
|
|
|
|
}
|
|
|
|
|
2024-07-09 03:57:58 -04:00
|
|
|
tree_t mutation_t::apply(gp_program& program, const tree_t& p)
|
2024-07-08 22:20:51 -04:00
|
|
|
{
|
|
|
|
auto c = p;
|
|
|
|
|
2024-08-03 13:16:53 -04:00
|
|
|
auto& ops_r = c.get_operations();
|
|
|
|
auto& vals_r = c.get_values();
|
2024-07-08 22:20:51 -04:00
|
|
|
|
2024-08-03 13:16:53 -04:00
|
|
|
auto begin_point = static_cast<blt::ptrdiff_t>(program.get_random().get_size_t(0ul, ops_r.size()));
|
|
|
|
auto end_point = find_endpoint(program, ops_r, begin_point);
|
2024-08-04 19:43:59 -04:00
|
|
|
auto begin_operator_id = ops_r[begin_point].id;
|
|
|
|
const auto& type_info = program.get_operator_info(begin_operator_id);
|
2024-07-08 22:20:51 -04:00
|
|
|
|
2024-08-03 13:16:53 -04:00
|
|
|
auto begin_itr = ops_r.begin() + begin_point;
|
|
|
|
auto end_itr = ops_r.begin() + end_point;
|
2024-07-08 22:20:51 -04:00
|
|
|
|
2024-07-09 03:57:58 -04:00
|
|
|
auto new_tree = config.generator.get().generate({program, type_info.return_type, config.replacement_min_depth, config.replacement_max_depth});
|
2024-07-08 22:20:51 -04:00
|
|
|
|
2024-08-03 13:16:53 -04:00
|
|
|
auto& new_ops_r = new_tree.get_operations();
|
|
|
|
auto& new_vals_r = new_tree.get_values();
|
2024-07-08 22:20:51 -04:00
|
|
|
|
2024-08-06 02:46:01 -04:00
|
|
|
blt::size_t total_bytes_after = accumulate_type_sizes(end_itr, ops_r.end());
|
|
|
|
auto* stack_after_data = get_thread_pointer_for_size<struct mutation>(total_bytes_after);
|
|
|
|
|
|
|
|
// make a copy of any stack data after the mutation point / children.
|
|
|
|
vals_r.copy_to(stack_after_data, total_bytes_after);
|
|
|
|
|
|
|
|
// remove the bytes of the data after the mutation point and the data for the children of the mutation node.
|
|
|
|
vals_r.pop_bytes(static_cast<blt::ptrdiff_t>(total_bytes_after + accumulate_type_sizes(begin_itr, end_itr)));
|
2024-07-08 22:20:51 -04:00
|
|
|
|
2024-08-06 02:46:01 -04:00
|
|
|
// insert the new tree then move back the data from after the original mutation point.
|
2024-08-04 22:07:41 -04:00
|
|
|
vals_r.insert(std::move(new_vals_r));
|
2024-08-06 02:46:01 -04:00
|
|
|
vals_r.copy_from(stack_after_data, total_bytes_after);
|
2024-07-08 22:20:51 -04:00
|
|
|
|
2024-08-03 13:16:53 -04:00
|
|
|
auto before = begin_itr - 1;
|
|
|
|
ops_r.erase(begin_itr, end_itr);
|
|
|
|
ops_r.insert(++before, new_ops_r.begin(), new_ops_r.end());
|
2024-08-05 02:40:16 -04:00
|
|
|
|
|
|
|
// this will check to make sure that the tree is in a correct and executable state. it requires that the evaluation is context free!
|
2024-08-02 21:08:34 -04:00
|
|
|
#if BLT_DEBUG_LEVEL >= 2
|
2024-08-03 21:26:39 -04:00
|
|
|
BLT_ASSERT(new_vals_r.empty());
|
2024-08-06 02:46:01 -04:00
|
|
|
//BLT_ASSERT(stack_after.empty());
|
2024-08-02 21:08:34 -04:00
|
|
|
blt::size_t bytes_expected = 0;
|
2024-08-03 13:16:53 -04:00
|
|
|
auto bytes_size = vals_r.size().total_used_bytes;
|
2024-08-02 21:08:34 -04:00
|
|
|
|
|
|
|
for (const auto& op : c.get_operations())
|
|
|
|
{
|
|
|
|
if (op.is_value)
|
|
|
|
bytes_expected += stack_allocator::aligned_size(op.type_size);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (bytes_expected != bytes_size)
|
|
|
|
{
|
2024-08-04 22:07:41 -04:00
|
|
|
BLT_WARN_STREAM << "Stack state: " << vals_r.size() << "\n";
|
|
|
|
BLT_WARN("Child tree bytes %ld vs expected %ld, difference: %ld", bytes_size, bytes_expected,
|
|
|
|
static_cast<blt::ptrdiff_t>(bytes_expected) - static_cast<blt::ptrdiff_t>(bytes_size));
|
2024-08-05 02:40:16 -04:00
|
|
|
BLT_TRACE("Total bytes after: %ld", total_bytes_after);
|
2024-08-02 21:08:34 -04:00
|
|
|
BLT_ABORT("Amount of bytes in stack doesn't match the number of bytes expected for the operations");
|
|
|
|
}
|
2024-08-03 13:16:53 -04:00
|
|
|
auto copy = c;
|
|
|
|
try
|
|
|
|
{
|
|
|
|
auto result = copy.evaluate(nullptr);
|
|
|
|
blt::black_box(result);
|
|
|
|
} catch (...)
|
|
|
|
{
|
2024-08-03 21:26:39 -04:00
|
|
|
std::cout << "This occurred at point " << begin_point << " ending at (old) " << end_point << "\n";
|
2024-08-04 22:07:41 -04:00
|
|
|
std::cout << "our root type is " << ops_r[begin_point].id << " with size " << stack_allocator::aligned_size(ops_r[begin_point].type_size)
|
|
|
|
<< "\n";
|
2024-08-03 21:26:39 -04:00
|
|
|
std::cout << "now Named: " << (program.get_name(ops_r[begin_point].id) ? *program.get_name(ops_r[begin_point].id) : "Unnamed") << "\n";
|
2024-08-04 19:43:59 -04:00
|
|
|
std::cout << "Was named: " << (program.get_name(begin_operator_id) ? *program.get_name(begin_operator_id) : "Unnamed") << "\n";
|
2024-08-03 21:26:39 -04:00
|
|
|
std::cout << "Parent:" << std::endl;
|
2024-08-03 13:16:53 -04:00
|
|
|
p.print(program, std::cout, false, true);
|
2024-08-03 21:26:39 -04:00
|
|
|
std::cout << "Child:" << std::endl;
|
2024-08-03 13:16:53 -04:00
|
|
|
c.print(program, std::cout, false, true);
|
2024-08-03 21:26:39 -04:00
|
|
|
std::cout << std::endl;
|
2024-08-03 13:16:53 -04:00
|
|
|
c.print(program, std::cout, true, true);
|
2024-08-03 21:26:39 -04:00
|
|
|
std::cout << std::endl;
|
2024-08-03 13:16:53 -04:00
|
|
|
throw std::exception();
|
|
|
|
}
|
2024-08-02 21:08:34 -04:00
|
|
|
#endif
|
2024-07-08 22:20:51 -04:00
|
|
|
|
|
|
|
return c;
|
|
|
|
}
|
2024-07-09 03:57:58 -04:00
|
|
|
|
2024-07-20 15:45:07 -04:00
|
|
|
blt::ptrdiff_t find_endpoint(blt::gp::gp_program& program, const std::vector<blt::gp::op_container_t>& container, blt::ptrdiff_t index)
|
|
|
|
{
|
|
|
|
blt::i64 children_left = 0;
|
|
|
|
|
|
|
|
do
|
|
|
|
{
|
|
|
|
const auto& type = program.get_operator_info(container[index].id);
|
|
|
|
// this is a child to someone
|
|
|
|
if (children_left != 0)
|
|
|
|
children_left--;
|
|
|
|
if (type.argc.argc > 0)
|
|
|
|
children_left += type.argc.argc;
|
|
|
|
index++;
|
|
|
|
} while (children_left > 0);
|
|
|
|
|
|
|
|
return index;
|
|
|
|
}
|
2024-06-27 03:01:39 -04:00
|
|
|
}
|