mutable — A Database System for Research and Fast Prototyping

WasmOperator.cpp
#include "backend/WasmOperator.hpp"

#include <mutable/util/fn.hpp>
#include <numeric>


using namespace m;
using namespace m::ast;
using namespace m::storage;
using namespace m::wasm;

/*======================================================================================================================
 * CLI arguments
 *====================================================================================================================*/

namespace {

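/* Executed at load time (constructor priority 201), i.e. before `main()` runs, this function registers all
 * Wasm-backend-specific command-line arguments with the catalog's argument parser. */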
__attribute__((constructor(201)))
static void add_wasm_operator_args()
{
    Catalog &C = Catalog::Get();

    /*----- Command-line arguments -----*/
    C.arg_parser().add<std::vector<std::string_view>>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--scan-implementations",
        /* description= */ "a comma-separated list of physical scan implementations to consider (`Scan` or "
                           "`IndexScan`)",
        /* callback= */ [](std::vector<std::string_view> impls){
            options::scan_implementations = option_configs::ScanImplementation(0UL);
            for (const auto &elem : impls) {
                if (strneq(elem.data(), "Scan", elem.size()))
                    options::scan_implementations |= option_configs::ScanImplementation::SCAN;
                else if (strneq(elem.data(), "IndexScan", elem.size()))
                    options::scan_implementations |= option_configs::ScanImplementation::INDEX_SCAN;
                else
                    std::cerr << "warning: ignoring invalid physical scan implementation " << elem << std::endl;
            }
        }
    );
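    /* Example: `--scan-implementations Scan,IndexScan` lets the physical optimizer consider both implementations;
     * omitting the flag leaves the default set of implementations unchanged. */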
    C.arg_parser().add<std::vector<std::string_view>>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--grouping-implementations",
        /* description= */ "a comma-separated list of physical grouping implementations to consider (`HashBased` or "
                           "`Ordered`)",
        /* callback= */ [](std::vector<std::string_view> impls){
            options::grouping_implementations = option_configs::GroupingImplementation(0UL);
            for (const auto &elem : impls) {
                if (strneq(elem.data(), "HashBased", elem.size()))
                    options::grouping_implementations |= option_configs::GroupingImplementation::HASH_BASED;
                else if (strneq(elem.data(), "Ordered", elem.size()))
                    options::grouping_implementations |= option_configs::GroupingImplementation::ORDERED;
                else
                    std::cerr << "warning: ignoring invalid physical grouping implementation " << elem << std::endl;
            }
        }
    );
    C.arg_parser().add<std::vector<std::string_view>>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--sorting-implementations",
        /* description= */ "a comma-separated list of physical sorting implementations to consider (`Quicksort` or "
                           "`NoOp`)",
        /* callback= */ [](std::vector<std::string_view> impls){
            options::sorting_implementations = option_configs::SortingImplementation(0UL);
            for (const auto &elem : impls) {
                if (strneq(elem.data(), "Quicksort", elem.size()))
                    options::sorting_implementations |= option_configs::SortingImplementation::QUICKSORT;
                else if (strneq(elem.data(), "NoOp", elem.size()))
                    options::sorting_implementations |= option_configs::SortingImplementation::NOOP;
                else
                    std::cerr << "warning: ignoring invalid physical sorting implementation " << elem << std::endl;
            }
        }
    );
    C.arg_parser().add<std::vector<std::string_view>>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--join-implementations",
        /* description= */ "a comma-separated list of physical join implementations to consider (`NestedLoops`, "
                           "`SimpleHash`, or `SortMerge`)",
        /* callback= */ [](std::vector<std::string_view> impls){
            options::join_implementations = option_configs::JoinImplementation(0UL);
            for (const auto &elem : impls) {
                if (strneq(elem.data(), "NestedLoops", elem.size()))
                    options::join_implementations |= option_configs::JoinImplementation::NESTED_LOOPS;
                else if (strneq(elem.data(), "SimpleHash", elem.size()))
                    options::join_implementations |= option_configs::JoinImplementation::SIMPLE_HASH;
                else if (strneq(elem.data(), "SortMerge", elem.size()))
                    options::join_implementations |= option_configs::JoinImplementation::SORT_MERGE;
                else
                    std::cerr << "warning: ignoring invalid physical join implementation " << elem << std::endl;
            }
        }
    );
    C.arg_parser().add<std::vector<std::string_view>>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--index-implementations",
        /* description= */ "a comma-separated list of index implementations to consider for index scans (`Array` or "
                           "`Rmi`)",
        /* callback= */ [](std::vector<std::string_view> impls){
            options::index_implementations = option_configs::IndexImplementation(0UL);
            for (const auto &elem : impls) {
                if (strneq(elem.data(), "Array", elem.size()))
                    options::index_implementations |= option_configs::IndexImplementation::ARRAY;
                else if (strneq(elem.data(), "Rmi", elem.size()))
                    options::index_implementations |= option_configs::IndexImplementation::RMI;
                else
                    std::cerr << "warning: ignoring invalid index implementation " << elem << std::endl;
            }
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--index-scan-strategy",
        /* description= */ "specify the index scan strategy (`Compilation`, `Interpretation`, or `Hybrid`)",
        /* callback= */ [](const char *strategy){
            if (streq(strategy, "Compilation"))
                options::index_scan_strategy = option_configs::IndexScanStrategy::COMPILATION;
            else if (streq(strategy, "Interpretation"))
                options::index_scan_strategy = option_configs::IndexScanStrategy::INTERPRETATION;
            else if (streq(strategy, "Hybrid"))
                options::index_scan_strategy = option_configs::IndexScanStrategy::HYBRID;
            else
                std::cerr << "warning: ignoring invalid index scan strategy " << strategy << std::endl;
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--index-scan-compilation-strategy",
        /* description= */ "specify the compilation strategy for index scans (`Callback` or `ExposedMemory`)",
        /* callback= */ [](const char *strategy){
            if (streq(strategy, "Callback"))
                options::index_scan_compilation_strategy = option_configs::IndexScanCompilationStrategy::CALLBACK;
            else if (streq(strategy, "ExposedMemory"))
                options::index_scan_compilation_strategy = option_configs::IndexScanCompilationStrategy::EXPOSED_MEMORY;
            else
                std::cerr << "warning: ignoring invalid index scan compilation strategy " << strategy << std::endl;
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--index-scan-materialization-strategy",
        /* description= */ "specify the materialization strategy for index scans (`Inline` or `Memory`)",
        /* callback= */ [](const char *strategy){
            if (streq(strategy, "Inline"))
                options::index_scan_materialization_strategy = option_configs::IndexScanMaterializationStrategy::INLINE;
            else if (streq(strategy, "Memory"))
                options::index_scan_materialization_strategy = option_configs::IndexScanMaterializationStrategy::MEMORY;
            else
                std::cerr << "warning: ignoring invalid index scan materialization strategy " << strategy << std::endl;
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--filter-selection-strategy",
        /* description= */ "specify the selection strategy for filters (`Branching` or `Predicated`)",
        /* callback= */ [](const char *strategy){
            if (streq(strategy, "Branching"))
                options::filter_selection_strategy = option_configs::SelectionStrategy::BRANCHING;
            else if (streq(strategy, "Predicated"))
                options::filter_selection_strategy = option_configs::SelectionStrategy::PREDICATED;
            else
                std::cerr << "warning: ignoring invalid filter selection strategy " << strategy << std::endl;
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--quicksort-cmp-selection-strategy",
        /* description= */ "specify the selection strategy for comparisons in quicksort (`Branching` or `Predicated`)",
        /* callback= */ [](const char *strategy){
            if (streq(strategy, "Branching"))
                options::quicksort_cmp_selection_strategy = option_configs::SelectionStrategy::BRANCHING;
            else if (streq(strategy, "Predicated"))
                options::quicksort_cmp_selection_strategy = option_configs::SelectionStrategy::PREDICATED;
            else
                std::cerr << "warning: ignoring invalid quicksort comparison selection strategy " << strategy << std::endl;
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--nested-loops-join-selection-strategy",
        /* description= */ "specify the selection strategy for nested-loops joins (`Branching` or `Predicated`)",
        /* callback= */ [](const char *strategy){
            if (streq(strategy, "Branching"))
                options::nested_loops_join_selection_strategy = option_configs::SelectionStrategy::BRANCHING;
            else if (streq(strategy, "Predicated"))
                options::nested_loops_join_selection_strategy = option_configs::SelectionStrategy::PREDICATED;
            else
                std::cerr << "warning: ignoring invalid nested-loops join selection strategy " << strategy << std::endl;
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--simple-hash-join-selection-strategy",
        /* description= */ "specify the selection strategy for simple hash joins (`Branching` or `Predicated`)",
        /* callback= */ [](const char *strategy){
            if (streq(strategy, "Branching"))
                options::simple_hash_join_selection_strategy = option_configs::SelectionStrategy::BRANCHING;
            else if (streq(strategy, "Predicated"))
                options::simple_hash_join_selection_strategy = option_configs::SelectionStrategy::PREDICATED;
            else
                std::cerr << "warning: ignoring invalid simple hash join selection strategy " << strategy << std::endl;
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--simple-hash-join-ordering-strategy",
        /* description= */ "specify the ordering strategy for simple hash joins (`BuildOnLeft` or `BuildOnRight`)",
        /* callback= */ [](const char *strategy){
            if (streq(strategy, "BuildOnLeft"))
                options::simple_hash_join_ordering_strategy = option_configs::OrderingStrategy::BUILD_ON_LEFT;
            else if (streq(strategy, "BuildOnRight"))
                options::simple_hash_join_ordering_strategy = option_configs::OrderingStrategy::BUILD_ON_RIGHT;
            else
                std::cerr << "warning: ignoring invalid simple hash join ordering strategy " << strategy << std::endl;
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--sort-merge-join-selection-strategy",
        /* description= */ "specify the selection strategy for sort-merge joins (`Branching` or `Predicated`)",
        /* callback= */ [](const char *strategy){
            if (streq(strategy, "Branching"))
                options::sort_merge_join_selection_strategy = option_configs::SelectionStrategy::BRANCHING;
            else if (streq(strategy, "Predicated"))
                options::sort_merge_join_selection_strategy = option_configs::SelectionStrategy::PREDICATED;
            else
                std::cerr << "warning: ignoring invalid sort-merge join selection strategy " << strategy << std::endl;
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--sort-merge-join-cmp-selection-strategy",
        /* description= */ "specify the selection strategy for comparisons while sorting in sort-merge joins "
                           "(`Branching` or `Predicated`)",
        /* callback= */ [](const char *strategy){
            if (streq(strategy, "Branching"))
                options::sort_merge_join_cmp_selection_strategy = option_configs::SelectionStrategy::BRANCHING;
            else if (streq(strategy, "Predicated"))
                options::sort_merge_join_cmp_selection_strategy = option_configs::SelectionStrategy::PREDICATED;
            else
                std::cerr << "warning: ignoring invalid sort-merge join comparison selection strategy " << strategy
                          << std::endl;
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--hash-table-implementation",
        /* description= */ "specify the hash table implementation (`OpenAddressing` or `Chained`)",
        /* callback= */ [](const char *impl){
            if (streq(impl, "OpenAddressing"))
                options::hash_table_implementation = option_configs::HashTableImplementation::OPEN_ADDRESSING;
            else if (streq(impl, "Chained"))
                options::hash_table_implementation = option_configs::HashTableImplementation::CHAINED;
            else
                std::cerr << "warning: ignoring invalid hash table implementation " << impl << std::endl;
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--hash-table-probing-strategy",
        /* description= */ "specify the probing strategy for hash tables (`Linear` or `Quadratic`)",
        /* callback= */ [](const char *strategy){
            if (streq(strategy, "Linear"))
                options::hash_table_probing_strategy = option_configs::ProbingStrategy::LINEAR;
            else if (streq(strategy, "Quadratic"))
                options::hash_table_probing_strategy = option_configs::ProbingStrategy::QUADRATIC;
            else
                std::cerr << "warning: ignoring invalid hash table probing strategy " << strategy << std::endl;
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--hash-table-storing-strategy",
        /* description= */ "specify the storing strategy for hash tables (`InPlace` or `OutOfPlace`)",
        /* callback= */ [](const char *strategy){
            if (streq(strategy, "InPlace"))
                options::hash_table_storing_strategy = option_configs::StoringStrategy::IN_PLACE;
            else if (streq(strategy, "OutOfPlace"))
                options::hash_table_storing_strategy = option_configs::StoringStrategy::OUT_OF_PLACE;
            else
                std::cerr << "warning: ignoring invalid hash table storing strategy " << strategy << std::endl;
        }
    );
    C.arg_parser().add<double>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--hash-table-max-load-factor",
        /* description= */ "specify the maximal load factor for hash tables, i.e. the load factor at which rehashing "
                           "should occur (must be in [1,∞) for chained and in [0.5,1) for open-addressing hash tables)",
        /* callback= */ [](double load_factor){
            options::load_factor_open_addressing = load_factor;
            options::load_factor_chained = load_factor;
        }
    );
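    /* Example: `--hash-table-max-load-factor 0.8` lets an open-addressing table rehash once 80 % of its slots are
     * occupied; for chained tables the load factor relates the number of entries to the number of buckets. */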
    C.arg_parser().add<uint32_t>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--hash-table-initial-capacity",
        /* description= */ "specify the initial capacity for hash tables",
        /* callback= */ [](uint32_t initial_capacity){
            options::hash_table_initial_capacity = initial_capacity;
        }
    );
    C.arg_parser().add<bool>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--no-hash-based-group-join",
        /* description= */ "disable potential use of hash-based group-join",
        /* callback= */ [](bool){ options::hash_based_group_join = false; }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--hard-pipeline-breaker-layout",
        /* description= */ "specify the layout for hard pipeline breakers (`Row`, `PAX4K`, `PAX64K`, `PAX512K`, "
                           "`PAX4M`, `PAX64M`, `PAX16Tup`, `PAX128Tup`, or `PAX1024Tup`)",
        /* callback= */ [](const char *layout){
            if (streq(layout, "Row")) {
                options::hard_pipeline_breaker_layout = std::make_unique<RowLayoutFactory>();
            } else {
                auto size_type = PAXLayoutFactory::NBytes;
                uint64_t block_size = 1UL << 12; // fall back to 4 KiB blocks on invalid input
                if (streq(layout, "PAX4K")) {
                    size_type = PAXLayoutFactory::NBytes;
                    block_size = 1UL << 12;
                } else if (streq(layout, "PAX64K")) {
                    size_type = PAXLayoutFactory::NBytes;
                    block_size = 1UL << 16;
                } else if (streq(layout, "PAX512K")) {
                    size_type = PAXLayoutFactory::NBytes;
                    block_size = 1UL << 19;
                } else if (streq(layout, "PAX4M")) {
                    size_type = PAXLayoutFactory::NBytes;
                    block_size = 1UL << 22;
                } else if (streq(layout, "PAX64M")) {
                    size_type = PAXLayoutFactory::NBytes;
                    block_size = 1UL << 26;
                } else if (streq(layout, "PAX16Tup")) {
                    size_type = PAXLayoutFactory::NTuples;
                    block_size = 16;
                } else if (streq(layout, "PAX128Tup")) {
                    size_type = PAXLayoutFactory::NTuples;
                    block_size = 128;
                } else if (streq(layout, "PAX1024Tup")) {
                    size_type = PAXLayoutFactory::NTuples;
                    block_size = 1024;
                } else {
                    std::cerr << "warning: ignoring invalid layout for hard pipeline breakers " << layout << std::endl;
                }
                options::hard_pipeline_breaker_layout = std::make_unique<PAXLayoutFactory>(size_type, block_size);
            }
        }
    );
    C.arg_parser().add<std::vector<std::string_view>>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--soft-pipeline-breaker",
        /* description= */ "a comma-separated list where to insert soft pipeline breakers (`AfterAll`, `AfterScan`, "
                           "`AfterFilter`, `AfterIndexScan`, `AfterProjection`, `AfterNestedLoopsJoin`, or "
                           "`AfterSimpleHashJoin`)",
        /* callback= */ [](std::vector<std::string_view> location){
            options::soft_pipeline_breaker = option_configs::SoftPipelineBreakerStrategy(0UL);
            for (const auto &elem : location) {
                if (strneq(elem.data(), "AfterAll", elem.size()))
                    options::soft_pipeline_breaker |= option_configs::SoftPipelineBreakerStrategy::AFTER_ALL;
                else if (strneq(elem.data(), "AfterScan", elem.size()))
                    options::soft_pipeline_breaker |= option_configs::SoftPipelineBreakerStrategy::AFTER_SCAN;
                else if (strneq(elem.data(), "AfterFilter", elem.size()))
                    options::soft_pipeline_breaker |= option_configs::SoftPipelineBreakerStrategy::AFTER_FILTER;
                else if (strneq(elem.data(), "AfterIndexScan", elem.size()))
                    options::soft_pipeline_breaker |= option_configs::SoftPipelineBreakerStrategy::AFTER_INDEX_SCAN;
                else if (strneq(elem.data(), "AfterProjection", elem.size()))
                    options::soft_pipeline_breaker |= option_configs::SoftPipelineBreakerStrategy::AFTER_PROJECTION;
                else if (strneq(elem.data(), "AfterNestedLoopsJoin", elem.size()))
                    options::soft_pipeline_breaker |= option_configs::SoftPipelineBreakerStrategy::AFTER_NESTED_LOOPS_JOIN;
                else if (strneq(elem.data(), "AfterSimpleHashJoin", elem.size()))
                    options::soft_pipeline_breaker |= option_configs::SoftPipelineBreakerStrategy::AFTER_SIMPLE_HASH_JOIN;
                else
                    std::cerr << "warning: ignoring invalid location for soft pipeline breakers " << elem << std::endl;
            }
        }
    );
    C.arg_parser().add<const char*>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--soft-pipeline-breaker-layout",
        /* description= */ "specify the layout for soft pipeline breakers (`Row`, `PAX4K`, `PAX64K`, `PAX512K`, "
                           "`PAX4M`, `PAX64M`, `PAX16Tup`, `PAX128Tup`, or `PAX1024Tup`)",
        /* callback= */ [](const char *layout){
            if (streq(layout, "Row")) {
                options::soft_pipeline_breaker_layout = std::make_unique<RowLayoutFactory>();
            } else {
                auto size_type = PAXLayoutFactory::NBytes;
                uint64_t block_size = 1UL << 12; // fall back to 4 KiB blocks on invalid input
                if (streq(layout, "PAX4K")) {
                    size_type = PAXLayoutFactory::NBytes;
                    block_size = 1UL << 12;
                } else if (streq(layout, "PAX64K")) {
                    size_type = PAXLayoutFactory::NBytes;
                    block_size = 1UL << 16;
                } else if (streq(layout, "PAX512K")) {
                    size_type = PAXLayoutFactory::NBytes;
                    block_size = 1UL << 19;
                } else if (streq(layout, "PAX4M")) {
                    size_type = PAXLayoutFactory::NBytes;
                    block_size = 1UL << 22;
                } else if (streq(layout, "PAX64M")) {
                    size_type = PAXLayoutFactory::NBytes;
                    block_size = 1UL << 26;
                } else if (streq(layout, "PAX16Tup")) {
                    size_type = PAXLayoutFactory::NTuples;
                    block_size = 16;
                } else if (streq(layout, "PAX128Tup")) {
                    size_type = PAXLayoutFactory::NTuples;
                    block_size = 128;
                } else if (streq(layout, "PAX1024Tup")) {
                    size_type = PAXLayoutFactory::NTuples;
                    block_size = 1024;
                } else {
                    std::cerr << "warning: ignoring invalid layout for soft pipeline breakers " << layout << std::endl;
                }
                options::soft_pipeline_breaker_layout = std::make_unique<PAXLayoutFactory>(size_type, block_size);
            }
        }
    );
    C.arg_parser().add<std::size_t>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--soft-pipeline-breaker-num-tuples",
        /* description= */ "set the size in tuples for soft pipeline breakers (0 means infinite)",
        /* callback= */ [](std::size_t num_tuples){ options::soft_pipeline_breaker_num_tuples = num_tuples; }
    );
    C.arg_parser().add<std::size_t>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--index-sequential-scan-batch-size",
        /* description= */ "set the number of tuple IDs communicated between host and V8 per batch during index "
                           "sequential scan (0 means infinite), ignored in case of --isam-compile-qualifying",
        /* callback= */ [](std::size_t size){ options::index_sequential_scan_batch_size = size; }
    );
    C.arg_parser().add<std::size_t>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--result-set-window-size",
        /* description= */ "set the window size in tuples for the result set (0 means infinite)",
        /* callback= */ [](std::size_t size){ options::result_set_window_size = size; }
    );
    C.arg_parser().add<bool>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--no-exploit-unique-build",
        /* description= */ "disable potential exploitation of uniqueness of build key in hash joins",
        /* callback= */ [](bool){ options::exploit_unique_build = false; }
    );
    C.arg_parser().add<bool>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--no-simd",
        /* description= */ "disable potential use of SIMDfication",
        /* callback= */ [](bool){ options::simd = false; }
    );
    C.arg_parser().add<bool>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--no-double-pumping",
        /* description= */ "disable use of double pumping (only has an effect if SIMDfication is enabled)",
        /* callback= */ [](bool){ options::double_pumping = false; }
    );
    C.arg_parser().add<std::size_t>(
        /* group= */ "Wasm",
        /* short= */ nullptr,
        /* long= */ "--simd-lanes",
        /* description= */ "set the number of SIMD lanes to prefer",
        /* callback= */ [](std::size_t lanes){ options::simd_lanes = lanes; }
    );
    C.arg_parser().add<std::vector<std::string_view>>(
        /* group= */ "Hacks",
        /* short= */ nullptr,
        /* long= */ "--xxx-asc-sorted-attributes",
        /* description= */ "a comma-separated list of attributes, i.e. of the format `T.x` where `T` is either the "
                           "table name or the alias and `x` is the attribute name, which are assumed to be sorted "
                           "ascending",
        /* callback= */ [&C](std::vector<std::string_view> attrs){
            for (const auto &elem : attrs) {
                auto idx = elem.find('.');
                if (idx == std::string_view::npos) {
                    std::cerr << "warning: ignoring invalid attribute " << elem << std::endl;
                    continue; // skip malformed entry instead of constructing a bogus identifier
                }
                Schema::Identifier attr(C.pool(elem.substr(0, idx)), C.pool(elem.substr(idx + 1)));
                options::sorted_attributes.emplace_back(std::move(attr), true);
            }
        }
    );
    C.arg_parser().add<std::vector<std::string_view>>(
        /* group= */ "Hacks",
        /* short= */ nullptr,
        /* long= */ "--xxx-desc-sorted-attributes",
        /* description= */ "a comma-separated list of attributes, i.e. of the format `T.x` where `T` is either the "
                           "table name or the alias and `x` is the attribute name, which are assumed to be sorted "
                           "descending",
        /* callback= */ [&C](std::vector<std::string_view> attrs){
            for (const auto &elem : attrs) {
                auto idx = elem.find('.');
                if (idx == std::string_view::npos) {
                    std::cerr << "warning: ignoring invalid attribute " << elem << std::endl;
                    continue; // skip malformed entry instead of constructing a bogus identifier
                }
                Schema::Identifier attr(C.pool(elem.substr(0, idx)), C.pool(elem.substr(idx + 1)));
                options::sorted_attributes.emplace_back(std::move(attr), false);
            }
        }
    );
}

}


/*======================================================================================================================
 * register_wasm_operators()
 *====================================================================================================================*/

void m::wasm::register_wasm_operators(PhysicalOptimizer &phys_opt)
{
    phys_opt.register_operator<NoOp>();
    phys_opt.register_operator<Callback<false>>();
    phys_opt.register_operator<Callback<true>>();
    phys_opt.register_operator<Print<false>>();
    phys_opt.register_operator<Print<true>>();
    if (bool(options::scan_implementations bitand option_configs::ScanImplementation::SCAN)) {
        phys_opt.register_operator<Scan<false>>();
        if (options::simd)
            phys_opt.register_operator<Scan<true>>();
    }
    if (bool(options::scan_implementations bitand option_configs::ScanImplementation::INDEX_SCAN)) {
        if (bool(options::index_implementations bitand option_configs::IndexImplementation::ARRAY))
            phys_opt.register_operator<IndexScan<idx::IndexMethod::Array>>();
        if (bool(options::index_implementations bitand option_configs::IndexImplementation::RMI))
            phys_opt.register_operator<IndexScan<idx::IndexMethod::Rmi>>();
    }
    if (bool(options::filter_selection_strategy bitand option_configs::SelectionStrategy::BRANCHING))
        phys_opt.register_operator<Filter<false>>();
    if (bool(options::filter_selection_strategy bitand option_configs::SelectionStrategy::PREDICATED))
        phys_opt.register_operator<Filter<true>>();
    phys_opt.register_operator<LazyDisjunctiveFilter>();
    phys_opt.register_operator<Projection>();
    if (bool(options::grouping_implementations bitand option_configs::GroupingImplementation::HASH_BASED))
        phys_opt.register_operator<HashBasedGrouping>();
    if (bool(options::grouping_implementations bitand option_configs::GroupingImplementation::ORDERED))
        phys_opt.register_operator<OrderedGrouping>();
    phys_opt.register_operator<Aggregation>();
    if (bool(options::sorting_implementations bitand option_configs::SortingImplementation::QUICKSORT)) {
        if (bool(options::quicksort_cmp_selection_strategy bitand option_configs::SelectionStrategy::BRANCHING))
            phys_opt.register_operator<Quicksort<false>>();
        if (bool(options::quicksort_cmp_selection_strategy bitand option_configs::SelectionStrategy::PREDICATED))
            phys_opt.register_operator<Quicksort<true>>();
    }
    if (bool(options::sorting_implementations bitand option_configs::SortingImplementation::NOOP))
        phys_opt.register_operator<NoOpSorting>();
    if (bool(options::join_implementations bitand option_configs::JoinImplementation::NESTED_LOOPS)) {
        if (bool(options::nested_loops_join_selection_strategy bitand option_configs::SelectionStrategy::BRANCHING))
            phys_opt.register_operator<NestedLoopsJoin<false>>();
        if (bool(options::nested_loops_join_selection_strategy bitand option_configs::SelectionStrategy::PREDICATED))
            phys_opt.register_operator<NestedLoopsJoin<true>>();
    }
    if (bool(options::join_implementations bitand option_configs::JoinImplementation::SIMPLE_HASH)) {
        if (bool(options::simple_hash_join_selection_strategy bitand option_configs::SelectionStrategy::BRANCHING)) {
            phys_opt.register_operator<SimpleHashJoin<false, false>>();
            if (options::exploit_unique_build)
                phys_opt.register_operator<SimpleHashJoin<true, false>>();
        }
        if (bool(options::simple_hash_join_selection_strategy bitand option_configs::SelectionStrategy::PREDICATED)) {
            phys_opt.register_operator<SimpleHashJoin<false, true>>();
            if (options::exploit_unique_build)
                phys_opt.register_operator<SimpleHashJoin<true, true>>();
        }
    }
    if (bool(options::join_implementations bitand option_configs::JoinImplementation::SORT_MERGE)) {
        if (bool(options::sort_merge_join_selection_strategy bitand option_configs::SelectionStrategy::BRANCHING)) {
            if (bool(options::sort_merge_join_cmp_selection_strategy bitand option_configs::SelectionStrategy::BRANCHING)) {
                phys_opt.register_operator<SortMergeJoin<false, false, false, false>>();
                phys_opt.register_operator<SortMergeJoin<false, true,  false, false>>();
                phys_opt.register_operator<SortMergeJoin<true,  false, false, false>>();
                phys_opt.register_operator<SortMergeJoin<true,  true,  false, false>>();
            }
            if (bool(options::sort_merge_join_cmp_selection_strategy bitand option_configs::SelectionStrategy::PREDICATED)) {
                phys_opt.register_operator<SortMergeJoin<false, false, false, true>>();
                phys_opt.register_operator<SortMergeJoin<false, true,  false, true>>();
                phys_opt.register_operator<SortMergeJoin<true,  false, false, true>>();
                phys_opt.register_operator<SortMergeJoin<true,  true,  false, true>>();
            }
        }
        if (bool(options::sort_merge_join_selection_strategy bitand option_configs::SelectionStrategy::PREDICATED)) {
            if (bool(options::sort_merge_join_cmp_selection_strategy bitand option_configs::SelectionStrategy::BRANCHING)) {
                phys_opt.register_operator<SortMergeJoin<false, false, true, false>>();
                phys_opt.register_operator<SortMergeJoin<false, true,  true, false>>();
                phys_opt.register_operator<SortMergeJoin<true,  false, true, false>>();
                phys_opt.register_operator<SortMergeJoin<true,  true,  true, false>>();
            }
            if (bool(options::sort_merge_join_cmp_selection_strategy bitand option_configs::SelectionStrategy::PREDICATED)) {
                phys_opt.register_operator<SortMergeJoin<false, false, true, true>>();
                phys_opt.register_operator<SortMergeJoin<false, true,  true, true>>();
                phys_opt.register_operator<SortMergeJoin<true,  false, true, true>>();
                phys_opt.register_operator<SortMergeJoin<true,  true,  true, true>>();
            }
        }
    }
    phys_opt.register_operator<Limit>();
    if (options::hash_based_group_join)
        phys_opt.register_operator<HashBasedGroupJoin>();
}
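/* Note that only the operators registered above participate in physical plan enumeration, so the CLI flags parsed in
 * `add_wasm_operator_args()` effectively prune the physical optimizer's search space. */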


/*======================================================================================================================
 * Helper structs and functions
 *====================================================================================================================*/

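/** Emits code that materializes the result set of \p schema, laid out according to \p factory, and passes completed
 * windows of \p window_size tuples (or the entire result set at once if \p window_size is 0) to the host via the
 * imported `read_result_set` function. \p child is the already compiled child pipeline producing the result tuples. */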
void write_result_set(const Schema &schema, const DataLayoutFactory &factory, uint32_t window_size,
                      const m::wasm::MatchBase &child)
{
    M_insist(schema == schema.drop_constants().deduplicate(), "schema must not contain constants or duplicates");
    M_insist(CodeGenContext::Get().env().empty(), "all environment entries must be used");

    /*----- Set data layout factory used for the result set. -----*/
    auto &context = WasmEngine::Get_Wasm_Context_By_ID(Module::ID());
    context.result_set_factory = factory.clone();

    if (schema.num_entries() == 0) { // result set contains only NULL constants
        if (window_size != 0) { // i.e. result set is materialized only partially
            M_insist(window_size >= CodeGenContext::Get().num_simd_lanes());
            M_insist(window_size % CodeGenContext::Get().num_simd_lanes() == 0);

            std::optional<Var<U32x1>> counter;
            Global<U32x1> counter_backup; // default initialized to 0

            /*----- Create child function s.t. result set is extracted in case of returns (e.g. due to `Limit`). -----*/
            FUNCTION(child_pipeline, void(void))
            {
                auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function

                child.execute(
                    /* setup= */ setup_t::Make_Without_Parent([&](){ counter.emplace(counter_backup); }),
                    /* pipeline= */ [&](){
                        M_insist(bool(counter));

                        /*----- Increment tuple ID. -----*/
                        if (auto &env = CodeGenContext::Get().env(); env.predicated()) {
                            M_insist(CodeGenContext::Get().num_simd_lanes() == 1,
                                     "SIMDfication with predication not supported");
                            *counter += env.extract_predicate<_Boolx1>().is_true_and_not_null().to<uint32_t>();
                        } else {
                            *counter += uint32_t(CodeGenContext::Get().num_simd_lanes());
                        }

                        /*----- If window size is reached, update result size, extract current results, and reset tuple ID. */
                        IF (*counter == window_size) {
                            CodeGenContext::Get().inc_num_tuples(U32x1(window_size));
                            Module::Get().emit_call<void>("read_result_set", Ptr<void>::Nullptr(), U32x1(window_size));
                            *counter = 0U;
                        };
                    },
                    /* teardown= */ teardown_t::Make_Without_Parent([&](){
                        M_insist(bool(counter));
                        counter_backup = *counter;
                        counter.reset();
                    })
                );
            }
            child_pipeline(); // call child function

            /*----- Update number of result tuples. -----*/
            CodeGenContext::Get().inc_num_tuples(counter_backup);

            /*----- Extract remaining results. -----*/
            Module::Get().emit_call<void>("read_result_set", Ptr<void>::Nullptr(), counter_backup.val());
        } else { // i.e. result set is materialized entirely
            /*----- Create child function s.t. result set is extracted in case of returns (e.g. due to `Limit`). -----*/
            FUNCTION(child_pipeline, void(void))
            {
                auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function

                std::optional<Var<U32x1>> num_tuples;

                child.execute(
                    /* setup= */ setup_t::Make_Without_Parent([&](){
                        num_tuples.emplace(CodeGenContext::Get().num_tuples());
                    }),
                    /* pipeline= */ [&](){
                        M_insist(bool(num_tuples));
                        if (auto &env = CodeGenContext::Get().env(); env.predicated()) {
                            M_insist(CodeGenContext::Get().num_simd_lanes() == 1,
                                     "SIMDfication with predication not supported");
                            *num_tuples += env.extract_predicate<_Boolx1>().is_true_and_not_null().to<uint32_t>();
                        } else {
                            *num_tuples += uint32_t(CodeGenContext::Get().num_simd_lanes());
                        }
                    },
                    /* teardown= */ teardown_t::Make_Without_Parent([&](){
                        M_insist(bool(num_tuples));
                        CodeGenContext::Get().set_num_tuples(*num_tuples);
                        num_tuples.reset();
                    })
                );
            }
            child_pipeline(); // call child function

            /*----- Extract all results at once. -----*/
            Module::Get().emit_call<void>("read_result_set", Ptr<void>::Nullptr(), CodeGenContext::Get().num_tuples());
        }
    } else { // result set contains actual values
        if (window_size != 0) { // i.e. result set is materialized only partially
            M_insist(window_size >= CodeGenContext::Get().num_simd_lanes());
            M_insist(window_size % CodeGenContext::Get().num_simd_lanes() == 0);

            /*----- Create finite global buffer (without `pipeline`-callback) used as reusable result set. -----*/
            GlobalBuffer result_set(schema, factory, false, window_size); // no callback to extract windows manually

            /*----- Create child function s.t. result set is extracted in case of returns (e.g. due to `Limit`). -----*/
            FUNCTION(child_pipeline, void(void))
            {
                auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function

                child.execute(
                    /* setup= */ setup_t::Make_Without_Parent([&](){ result_set.setup(); }),
                    /* pipeline= */ [&](){
                        /*----- Remember whether only a single slot is free, so we do not extract an empty buffer. -----*/
                        const Var<Boolx1> single_slot_free(
                            result_set.size() == window_size - uint32_t(CodeGenContext::Get().num_simd_lanes())
                        );

                        /*----- Write the result. -----*/
                        result_set.consume(); // also resets size to 0 in case buffer has reached window size

                        /*----- If the last buffer slot was filled, update result size and extract current results. */
                        IF (single_slot_free and result_set.size() == 0U) {
                            CodeGenContext::Get().inc_num_tuples(U32x1(window_size));
                            Module::Get().emit_call<void>("read_result_set", result_set.base_address(),
                                                          U32x1(window_size));
                        };
                    },
                    /* teardown= */ teardown_t::Make_Without_Parent([&](){ result_set.teardown(); })
                );
            }
            child_pipeline(); // call child function

            /*----- Update number of result tuples. -----*/
            CodeGenContext::Get().inc_num_tuples(result_set.size());

            /*----- Extract remaining results. -----*/
            Module::Get().emit_call<void>("read_result_set", result_set.base_address(), result_set.size());
        } else { // i.e. result set is materialized entirely
            /*----- Create infinite global buffer (without `pipeline`-callback) used as single result set. -----*/
            GlobalBuffer result_set(schema, factory); // no callback to extract results all at once

            /*----- Create child function s.t. result set is extracted in case of returns (e.g. due to `Limit`). -----*/
            FUNCTION(child_pipeline, void(void))
            {
                auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function

                child.execute(
                    /* setup= */ setup_t::Make_Without_Parent([&](){ result_set.setup(); }),
                    /* pipeline= */ [&](){ result_set.consume(); },
                    /* teardown= */ teardown_t::Make_Without_Parent([&](){ result_set.teardown(); })
                );
            }
            child_pipeline(); // call child function

            /*----- Set number of result tuples. -----*/
            CodeGenContext::Get().inc_num_tuples(result_set.size()); // not inside child function due to predication

            /*----- Extract all results at once. -----*/
            Module::Get().emit_call<void>("read_result_set", result_set.base_address(), result_set.size());
        }
    }
}

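/** Helper struct bundling the schema entry, function id, and arguments of an aggregate to compute. */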
struct aggregate_info_t
{
    Schema::entry_type entry; ///< the schema entry of the aggregate
    m::Function::fnid_t fnid; ///< the function id of the aggregate
    const std::vector<std::unique_ptr<ast::Expr>> &args; ///< the arguments of the aggregate
};

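/** Helper struct bundling the information required to compute an AVG aggregate. */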
struct avg_aggregate_info_t
{
    Schema::Identifier running_count; ///< the identifier of the running count used for this AVG aggregate
    Schema::Identifier sum; ///< the identifier of the SUM aggregate used for this AVG aggregate
    bool compute_running_avg; ///< whether the average is computed incrementally as a running average
};

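/** Computes additional information about the aggregates in \p aggregates, whose schema entries in \p schema start at
 * offset \p aggregates_offset. Returns a vector with one entry per aggregate to compute plus a map from each AVG
 * aggregate to the identifiers of its running count and sum and the flag whether to compute a running average. */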
std::pair<std::vector<aggregate_info_t>, std::unordered_map<Schema::Identifier, avg_aggregate_info_t>>
compute_aggregate_info(const std::vector<std::reference_wrapper<const FnApplicationExpr>> &aggregates,
                       const Schema &schema, std::size_t aggregates_offset = 0)
{
    std::vector<aggregate_info_t> aggregates_info;
    std::unordered_map<Schema::Identifier, avg_aggregate_info_t> avg_aggregates_info;

    for (std::size_t i = aggregates_offset; i < schema.num_entries(); ++i) {
        auto &e = schema[i];

        auto pred = [&e](const auto &info){ return info.entry.id == e.id; };
        if (auto it = std::find_if(aggregates_info.cbegin(), aggregates_info.cend(), pred); it != aggregates_info.cend())
            continue; // duplicated aggregate

        auto &fn_expr = aggregates[i - aggregates_offset].get();
        auto &fn = fn_expr.get_function();
        M_insist(fn.kind == m::Function::FN_Aggregate, "not an aggregation function");

        if (fn.fnid == m::Function::FN_AVG) {
            M_insist(fn_expr.args.size() == 1, "AVG aggregate function expects exactly one argument");

            /*----- Insert a suitable running count, i.e. COUNT over the argument of the AVG aggregate. -----*/
            auto pred = [&fn_expr](const auto &_fn_expr){
                M_insist(_fn_expr.get().get_function().fnid != m::Function::FN_COUNT or _fn_expr.get().args.size() <= 1,
                         "COUNT aggregate function expects at most one argument");
                return _fn_expr.get().get_function().fnid == m::Function::FN_COUNT and
                       not _fn_expr.get().args.empty() and *_fn_expr.get().args[0] == *fn_expr.args[0];
            };
            std::optional<Schema::Identifier> running_count;
            if (auto it = std::find_if(aggregates.cbegin(), aggregates.cend(), pred);
                it != aggregates.cend())
            { // reuse found running count
                const auto idx_agg = std::distance(aggregates.cbegin(), it);
                running_count = schema[aggregates_offset + idx_agg].id;
            } else { // insert additional running count
                std::ostringstream oss;
                oss << "$running_count_" << fn_expr;
                running_count = Schema::Identifier(Catalog::Get().pool(oss.str().c_str()));
                aggregates_info.emplace_back(aggregate_info_t{
                    .entry = { *running_count, Type::Get_Integer(Type::TY_Scalar, 8), Schema::entry_type::NOT_NULLABLE },
                    .fnid = m::Function::FN_COUNT,
                    .args = fn_expr.args
                });
            }

            /*----- Decide how to compute the average aggregate and insert sum aggregate accordingly. -----*/
            std::optional<Schema::Identifier> sum;
            bool compute_running_avg;
            if (fn_expr.args[0]->type()->size() <= 32) {
                /* Compute average by summing up all values in a 64-bit field (thus no overflows should occur) and
                 * dividing by the running count once at the end. */
                compute_running_avg = false;
                auto pred = [&fn_expr](const auto &_fn_expr){
                    M_insist(_fn_expr.get().get_function().fnid != m::Function::FN_SUM or
                             _fn_expr.get().args.size() == 1,
                             "SUM aggregate function expects exactly one argument");
                    return _fn_expr.get().get_function().fnid == m::Function::FN_SUM and
                           *_fn_expr.get().args[0] == *fn_expr.args[0];
                };
                if (auto it = std::find_if(aggregates.cbegin(), aggregates.cend(), pred);
                    it != aggregates.cend())
                { // reuse found SUM aggregate
                    const auto idx_agg = std::distance(aggregates.cbegin(), it);
                    sum = schema[aggregates_offset + idx_agg].id;
                } else { // insert additional SUM aggregate
                    std::ostringstream oss;
                    oss << "$sum_" << fn_expr;
                    sum = Schema::Identifier(Catalog::Get().pool(oss.str().c_str()));
                    const Type *type;
                    switch (as<const Numeric>(*fn_expr.args[0]->type()).kind) {
                        case Numeric::N_Int:
                        case Numeric::N_Decimal:
                            type = Type::Get_Integer(Type::TY_Scalar, 8);
                            break;
                        case Numeric::N_Float:
                            type = Type::Get_Double(Type::TY_Scalar);
                    }
                    aggregates_info.emplace_back(aggregate_info_t{
                        .entry = { *sum, type, e.constraints },
                        .fnid = m::Function::FN_SUM,
                        .args = fn_expr.args
                    });
                }
            } else {
                /* Compute average by computing a running average for each inserted value in a `_Doublex1` field (since
                 * the sum may overflow). */
                compute_running_avg = true;
                M_insist(e.type->is_double());
                aggregates_info.emplace_back(aggregate_info_t{
                    .entry = e,
                    .fnid = m::Function::FN_AVG,
                    .args = fn_expr.args
                });
            }

            /*----- Add info for this AVG aggregate. -----*/
            avg_aggregates_info.try_emplace(e.id, avg_aggregate_info_t{
                .running_count = std::move(*running_count),
                .sum = std::move(*sum),
                .compute_running_avg = compute_running_avg
            });
        } else {
            aggregates_info.emplace_back(aggregate_info_t{
                .entry = e,
                .fnid = fn.fnid,
                .args = fn_expr.args
            });
        }
    }

    return { std::move(aggregates_info), std::move(avg_aggregates_info) };
}

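/** Decomposes the equi-predicate \p cnf into the identifiers belonging to \p schema_left and the corresponding
 * identifiers of the other side. */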
std::pair<std::vector<Schema::Identifier>, std::vector<Schema::Identifier>>
decompose_equi_predicate(const cnf::CNF &cnf, const Schema &schema_left)
{
    std::vector<Schema::Identifier> ids_left, ids_right;
    for (auto &clause : cnf) {
        M_insist(clause.size() == 1, "invalid equi-predicate");
        auto &literal = clause[0];
        auto &binary = as<const BinaryExpr>(literal.expr());
        M_insist((not literal.negative() and binary.tok == TK_EQUAL) or
                 (literal.negative() and binary.tok == TK_BANG_EQUAL), "invalid equi-predicate");
        M_insist(is<const Designator>(binary.lhs), "invalid equi-predicate");
        M_insist(is<const Designator>(binary.rhs), "invalid equi-predicate");
        Schema::Identifier id_first(*binary.lhs), id_second(*binary.rhs);
        const auto &[id_left, id_right] = schema_left.has(id_first) ? std::make_pair(id_first, id_second)
                                                                    : std::make_pair(id_second, id_first);
        ids_left.push_back(std::move(id_left));
        ids_right.push_back(std::move(id_right));
    }
    M_insist(ids_left.size() == ids_right.size(), "number of found IDs differ");
    M_insist(not ids_left.empty(), "must find at least one ID");
    return { std::move(ids_left), std::move(ids_right) };
}

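/** Returns the number of rows of table \p table_name, read from the Wasm global `<table_name>_num_rows` imported from
 * the host. */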
U32x1 get_num_rows(const ThreadSafePooledString &table_name) {
    static std::ostringstream oss;
    oss.str("");
    oss << table_name << "_num_rows";
    return Module::Get().get_global<uint32_t>(oss.str().c_str());
}

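/** Returns the base address of the host memory backing table \p table_name, read from the imported Wasm global
 * `<table_name>_mem`. */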
Ptr<void> get_base_address(const ThreadSafePooledString &table_name) {
    static std::ostringstream oss;
    oss.str("");
    oss << table_name << "_mem";
    return Module::Get().get_global<void*>(oss.str().c_str());
}

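/** Computes the initial hash table capacity for \p op: the estimated cardinality (or the number of rows for a plain
 * scan) divided by \p load_factor, clamped to `uint32_t`; `--hash-table-initial-capacity` overrides this computation. */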
uint32_t compute_initial_ht_capacity(const Operator &op, double load_factor) {
    uint64_t initial_capacity;
    if (options::hash_table_initial_capacity) {
        initial_capacity = *options::hash_table_initial_capacity;
    } else {
        if (op.has_info())
            initial_capacity = static_cast<uint64_t>(std::ceil(op.info().estimated_cardinality / load_factor));
        else if (auto scan = cast<const ScanOperator>(&op))
            initial_capacity = static_cast<uint64_t>(std::ceil(scan->store().num_rows() / load_factor));
        else
            initial_capacity = 1024; // fallback
    }
    return std::in_range<uint32_t>(initial_capacity) ? initial_capacity : std::numeric_limits<uint32_t>::max();
}

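/** Helper struct bundling the indexed attribute and the lo/hi bounds (with their inclusiveness) of an index scan. */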
struct index_scan_bounds_t
{
    Schema::entry_type attribute; ///< the indexed attribute
    std::optional<std::reference_wrapper<const ast::Expr>> lo, hi; ///< the lo and hi bounds, if present
    bool is_inclusive_lo, is_inclusive_hi; ///< whether the lo/hi bound is inclusive
};

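/** Returns `true` iff \p expr is a valid bound for an index scan, i.e. a `Constant` possibly preceded by unary plus
 * or minus. */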
bool is_valid_bound(const ast::Expr &expr) {
    if (is<const Constant>(expr))
        return true;
    if (auto u = cast<const UnaryExpr>(&expr)) {
        /* `UnaryExpr` must be followed by `Constant`. */
        if ((u->op().type == TK_MINUS or u->op().type == TK_PLUS) and is<const Constant>(*u->expr))
            return true;
    }
    return false;
}

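/** Extracts the `Constant` from the valid bound \p expr; the returned flag signals whether the constant is negated. */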
std::pair<const Constant&, bool> get_valid_bound(const ast::Expr &expr) {
    M_insist(is_valid_bound(expr), "bound must be valid");
    if (auto c = cast<const Constant>(&expr))
        return { *c, false };
    auto &u = as<const UnaryExpr>(expr);
    return { as<const Constant>(*u.expr), u.op().type == TK_MINUS };
}

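/** Extracts the bounds of an index scan from the filter condition \p cnf, which must consist of conjunctions of
 * non-negated comparisons of a single attribute with valid constant bounds. */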
index_scan_bounds_t extract_index_scan_bounds(const cnf::CNF &cnf)
{
    index_scan_bounds_t bounds;

    M_insist(not cnf.empty(), "filter condition must not be empty");
    auto designators = cnf.get_required();
    M_insist(designators.num_entries() == 1, "filter condition must contain exactly one designator");
    bounds.attribute = designators[0];

    for (auto &clause : cnf) {
        M_insist(clause.size() == 1, "invalid predicate");
        auto &literal = clause[0];
        auto &binary = as<const BinaryExpr>(literal.expr());
        M_insist((is<const Designator>(binary.lhs) and is_valid_bound(*binary.rhs)) or
                 (is<const Designator>(binary.rhs) and is_valid_bound(*binary.lhs)), "invalid predicate");
        bool has_attribute_left = is<const Designator>(binary.lhs);
        auto &bound = has_attribute_left ? *binary.rhs : *binary.lhs;

        switch (binary.tok.type) {
            default:
                M_unreachable("unsupported token type");
            case TK_EQUAL:
                M_insist(not bool(bounds.lo) and not bool(bounds.hi), "bound already set");
                bounds.lo = bounds.hi = std::cref(bound);
                bounds.is_inclusive_lo = bounds.is_inclusive_hi = true;
                break;
            case TK_GREATER:
                if (has_attribute_left) {
                    M_insist(not bool(bounds.lo), "lo bound already set");
                    bounds.lo = std::cref(bound);
                    bounds.is_inclusive_lo = false;
                } else {
                    M_insist(not bool(bounds.hi), "hi bound already set");
                    bounds.hi = std::cref(bound);
                    bounds.is_inclusive_hi = false;
                }
                break;
            case TK_GREATER_EQUAL:
                if (has_attribute_left) {
                    M_insist(not bool(bounds.lo), "lo bound already set");
                    bounds.lo = std::cref(bound);
                    bounds.is_inclusive_lo = true;
                } else {
                    M_insist(not bool(bounds.hi), "hi bound already set");
                    bounds.hi = std::cref(bound);
                    bounds.is_inclusive_hi = true;
                }
                break;
            case TK_LESS:
                if (has_attribute_left) {
                    M_insist(not bool(bounds.hi), "hi bound already set");
                    bounds.hi = std::cref(bound);
                    bounds.is_inclusive_hi = false;
                } else {
                    M_insist(not bool(bounds.lo), "lo bound already set");
                    bounds.lo = std::cref(bound);
                    bounds.is_inclusive_lo = false;
                }
                break;
            case TK_LESS_EQUAL:
                if (has_attribute_left) {
                    M_insist(not bool(bounds.hi), "hi bound already set");
                    bounds.hi = std::cref(bound);
                    bounds.is_inclusive_hi = true;
                } else {
                    M_insist(not bool(bounds.lo), "lo bound already set");
                    bounds.lo = std::cref(bound);
                    bounds.is_inclusive_lo = true;
                }
                break;
        }
    }
    M_insist(bool(bounds.lo) or bool(bounds.hi), "either bound must be set");
    return bounds;
}


/*======================================================================================================================
 * NoOp
 *====================================================================================================================*/

void NoOp::execute(const Match<NoOp> &M, setup_t, pipeline_t, teardown_t)
{
    std::optional<Var<U32x1>> num_tuples;

    M.child->execute(
        /* setup= */ setup_t::Make_Without_Parent([&](){ num_tuples.emplace(CodeGenContext::Get().num_tuples()); }),
        /* pipeline= */ [&](){
            M_insist(bool(num_tuples));
            if (auto &env = CodeGenContext::Get().env(); env.predicated()) {
                switch (CodeGenContext::Get().num_simd_lanes()) {
                    default: M_unreachable("invalid number of simd lanes");
                    case 1: {
                        *num_tuples += env.extract_predicate<_Boolx1>().is_true_and_not_null().to<uint32_t>();
                        break;
                    }
                    case 16: {
                        auto pred = env.extract_predicate<_Boolx16>().is_true_and_not_null();
                        *num_tuples += pred.bitmask().popcnt();
                        break;
                    }
                }
            } else {
                *num_tuples += uint32_t(CodeGenContext::Get().num_simd_lanes());
            }
        },
        /* teardown= */ teardown_t::Make_Without_Parent([&](){
            M_insist(bool(num_tuples));
            CodeGenContext::Get().set_num_tuples(*num_tuples);
            num_tuples.reset();
        })
    );
}


/*======================================================================================================================
 * Callback
 *====================================================================================================================*/

template<bool SIMDfied>
ConditionSet Callback<SIMDfied>::pre_condition(std::size_t child_idx, const std::tuple<const CallbackOperator*>&)
{
    M_insist(child_idx == 0);

    ConditionSet pre_cond;

    if constexpr (SIMDfied) {
        /*----- SIMDfied callback supports SIMD but not predication. -----*/
        pre_cond.add_condition(Predicated(false));
    } else {
        /*----- Non-SIMDfied callback does not support SIMD. -----*/
        pre_cond.add_condition(NoSIMD());
    }

    return pre_cond;
}

template<bool SIMDfied>
void Callback<SIMDfied>::execute(const Match<Callback> &M, setup_t, pipeline_t, teardown_t)
{
    M_insist(bool(M.result_set_factory), "`wasm::Callback` must have a factory for the result set");

    auto result_set_schema = M.callback.schema().drop_constants().deduplicate();
    write_result_set(result_set_schema, *M.result_set_factory, M.result_set_window_size, *M.child);
}


/*======================================================================================================================
 * Print
 *====================================================================================================================*/

template<bool SIMDfied>
ConditionSet Print<SIMDfied>::pre_condition(std::size_t child_idx, const std::tuple<const PrintOperator*>&)
{
    M_insist(child_idx == 0);

    ConditionSet pre_cond;

    if constexpr (SIMDfied) {
        /*----- SIMDfied print supports SIMD but not predication. -----*/
        pre_cond.add_condition(Predicated(false));
    } else {
        /*----- Non-SIMDfied print does not support SIMD. -----*/
        pre_cond.add_condition(NoSIMD());
    }

    return pre_cond;
}

template<bool SIMDfied>
void Print<SIMDfied>::execute(const Match<Print> &M, setup_t, pipeline_t, teardown_t)
{
    M_insist(bool(M.result_set_factory), "`wasm::Print` must have a factory for the result set");

    auto result_set_schema = M.print_op.schema().drop_constants().deduplicate();
    write_result_set(result_set_schema, *M.result_set_factory, M.result_set_window_size, *M.child);
}


/*======================================================================================================================
 * Scan
 *====================================================================================================================*/

template<bool SIMDfied>
ConditionSet Scan<SIMDfied>::pre_condition(std::size_t child_idx,
                                           const std::tuple<const ScanOperator*> &partial_inner_nodes)
{
    M_insist(child_idx == 0);

    ConditionSet pre_cond;

    if constexpr (SIMDfied) {
        auto &scan = *std::get<0>(partial_inner_nodes);
        auto &table = scan.store().table();

        /*----- SIMDfied scan needs the data layout to support SIMD. -----*/
        if (not supports_simd(table.layout(), table.schema(scan.alias()), scan.schema()))
            return ConditionSet::Make_Unsatisfiable();

        /*----- SIMDfied scan needs the number of rows to load to be a whole multiple of the number of SIMD lanes. -*/
        if (scan.store().num_rows() % get_num_simd_lanes(table.layout(), table.schema(scan.alias()), scan.schema()) != 0)
            return ConditionSet::Make_Unsatisfiable();
    }

    return pre_cond;
}

template<bool SIMDfied>
ConditionSet Scan<SIMDfied>::post_condition(const Match<Scan> &M)
{
    ConditionSet post_cond;

    /*----- Scan does not introduce predication. -----*/
    post_cond.add_condition(Predicated(false));

    if constexpr (SIMDfied) {
        /*----- SIMDfied scan introduces SIMD vectors with respective number of lanes. -----*/
        auto &table = M.scan.store().table();
        const auto num_simd_lanes = get_num_simd_lanes(table.layout(), table.schema(M.scan.alias()), M.scan.schema());
        post_cond.add_condition(SIMD(num_simd_lanes));
    } else {
        /*----- Non-SIMDfied scan does not introduce SIMD. -----*/
        post_cond.add_condition(NoSIMD());
    }

    /*----- Check if any attribute of scanned table is assumed to be sorted. -----*/
    Sortedness::order_t orders;
    for (auto &e : M.scan.schema()) {
        auto pred = [&e](const auto &p){ return e.id == p.first; };
        if (auto it = std::find_if(options::sorted_attributes.cbegin(), options::sorted_attributes.cend(), pred);
            it != options::sorted_attributes.cend())
        {
            orders.add(e.id, it->second ? Sortedness::O_ASC : Sortedness::O_DESC);
        }
    }
    if (not orders.empty())
        post_cond.add_condition(Sortedness(std::move(orders)));

    return post_cond;
}

template<bool SIMDfied>
void Scan<SIMDfied>::execute(const Match<Scan> &M, setup_t setup, pipeline_t pipeline, teardown_t teardown)
{
    auto &schema = M.scan.schema();
    auto &table = M.scan.store().table();

    M_insist(schema == schema.drop_constants().deduplicate(),
             "schema of `ScanOperator` must not contain constants or duplicates");
    M_insist(not table.layout().is_finite(), "layout for `wasm::Scan` must be infinite");

    Var<U32x1> tuple_id; // default initialized to 0

    /*----- Compute possible number of SIMD lanes and decide which to use with regard to other operators' preferences. */
    const auto layout_schema = table.schema(M.scan.alias());
    const auto num_simd_lanes_preferred =
        CodeGenContext::Get().num_simd_lanes_preferred(); // get other operators' preferences
    const std::size_t num_simd_lanes =
        SIMDfied ? (options::double_pumping ? 2 : 1)
                       * std::max(num_simd_lanes_preferred, get_num_simd_lanes(table.layout(), layout_schema, schema))
                 : 1;
    CodeGenContext::Get().set_num_simd_lanes(num_simd_lanes);

    /*----- Import the number of rows of `table`. -----*/
    U32x1 num_rows = get_num_rows(table.name());

    /*----- If no attributes must be loaded, generate a loop just executing the pipeline `num_rows`-times. -----*/
    if (schema.num_entries() == 0) {
        setup();
        WHILE (tuple_id < num_rows) {
            tuple_id += uint32_t(num_simd_lanes);
            pipeline();
        }
        teardown();
        return;
    }

    /*----- Import the base address of the mapped memory. -----*/
    Ptr<void> base_address = get_base_address(table.name());

    /*----- Emit setup code *before* compiling data layout to not overwrite its temporary boolean variables. -----*/
    setup();

    /*----- Compile data layout to generate sequential load from table. -----*/
    static Schema empty_schema;
    auto [inits, loads, jumps] = compile_load_sequential(schema, empty_schema, base_address, table.layout(),
                                                         num_simd_lanes, layout_schema, tuple_id);

    /*----- Generate the loop for the actual scan, with the pipeline emitted into the loop body. -----*/
    inits.attach_to_current();
    WHILE (tuple_id < num_rows) {
        loads.attach_to_current();
        pipeline();
        jumps.attach_to_current();
    }

    /*----- Emit teardown code. -----*/
    teardown();
}


/*======================================================================================================================
 * Index Scan
 *====================================================================================================================*/

1333template<idx::IndexMethod IndexMethod>
1335 const std::tuple<const FilterOperator*,
1336 const ScanOperator*> &partial_inner_nodes)
1337{
1338 M_insist(child_idx == 0);
1339
1340 /*----- Check if index on one of the attributes in filter condition exists. -----*/
1341 auto &filter = *std::get<0>(partial_inner_nodes);
1342 auto &cnf = filter.filter();
1343
1344 M_insist(not cnf.empty(), "Filter condition must not be empty");
1345
1346 auto &scan = *std::get<1>(partial_inner_nodes);
1347 auto &table = scan.store().table();
1348
1349 Catalog &C = Catalog::Get();
1350 auto &DB = C.get_database_in_use();
1351
1352 /* Extract attributes from filter condition. */
1353 std::vector<Schema::Identifier> ids;
1354 for (auto &entry : cnf.get_required()) {
1355 Schema::Identifier &id = entry.id;
1356 M_insist(table.name() == id.prefix, "Table name should match designator table name");
1357
1358 /* Keep attributes for which an index exists. */
1359 if (DB.has_index(table.name(), id.name, IndexMethod))
1360 ids.push_back(id);
1361 }
1362 if (ids.empty()) // no usable index found
1364
1365 /*----- Check if filter condition is supported. -----*/
1366 /* We currently only support filter conditions of the following form.
1367 * 1. Point: condition with a single equality predicate, e.g.
1368 * x = 42.
1369 * 2. One-sided range: condition with a single greater/greater-or-equal/less/less-or-equal predicate, e.g.
1370 * x > 42.
1371 * 3. Two-sided range: condition with a greater/greater-or-equal predicate and a less/less-or-equal predicate, e.g.
1372 * x > 42 AND x <= 89.
1373 * Attributes may appear on either side. The other side is required to be a `Constant`. */
1374 if (ids.size() > 1) // conditions with more than one attribute currently not supported
1376
1377 bool has_lo_bound = false;
1378 bool has_hi_bound = false;
1379 for (auto &clause : cnf) {
1380 if (clause.size() != 1) // disjunctions not supported
1382
1383 auto &predicate = clause[0];
1384 if (predicate.negative()) // negated predicates not supported
1386
1387 auto expr = cast<const BinaryExpr>(&predicate.expr());
1388 if (not expr) // not a binary expression
1390
1391 bool has_attribute_left = is<const Designator>(expr->lhs);
1392 auto &attribute = has_attribute_left ? *expr->lhs : *expr->rhs;
1393 auto &constant = has_attribute_left ? *expr->rhs : *expr->lhs;
1394 if (not is<const Designator>(attribute)) // attribute must be on lhs
1396 if (not is_valid_bound(constant))
1398
1399 switch(expr->tok.type) {
1400 default:
1402 case TK_EQUAL:
1403 if (not has_lo_bound and not has_hi_bound) { // lo and hi bound not yet set
1404 has_lo_bound = has_hi_bound = true;
1405 } else {
1407 }
1408 break;
1409 case TK_GREATER:
1410 case TK_GREATER_EQUAL:
1411 if (has_attribute_left and not has_lo_bound) { // attribute on lhs, lo bound not yet set
1412 has_lo_bound = true;
1413 } else if (not has_attribute_left and not has_hi_bound) { // attribute on rhs, hi bound not yet set
1414 has_hi_bound = true;
1415 } else {
1416 return ConditionSet::Make_Unsatisfiable();
1417 }
1418 break;
1419 case TK_LESS:
1420 case TK_LESS_EQUAL:
1421 if (has_attribute_left and not has_hi_bound) { // attribute on lhs, hi bound not yet set
1422 has_hi_bound = true;
1423 } else if (not has_attribute_left and not has_lo_bound) { // attribute on rhs, lo bound not yet set
1424 has_lo_bound = true;
1425 } else {
1426 return ConditionSet::Make_Unsatisfiable();
1427 }
1428 break;
1429 }
1430 }
1431 return ConditionSet();
1432}
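/* Illustration (hypothetical table `R` with an index on attribute `x`): this pre-condition accepts
 * filters such as `x = 42`, `x > 42`, or `x > 42 AND x <= 89`, but rejects disjunctions
 * (`x = 42 OR x = 89`), negated predicates, conditions over more than one indexed attribute, and
 * bounds that are not constants (e.g. `x < y`). */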
1433
1434 template<idx::IndexMethod IndexMethod>
1435 ConditionSet IndexScan<IndexMethod>::post_condition(const Match<IndexScan<IndexMethod>> &M)
1436 {
1437 ConditionSet post_cond;
1438
1439 /*----- Index scan does not introduce predication. -----*/
1440 post_cond.add_condition(Predicated(false));
1441
1442 /*----- Non-SIMDfied index scan does not introduce SIMD. -----*/
1443 post_cond.add_condition(NoSIMD());
1444
1445 /*----- Index scan introduces sortedness on indexed attribute. -----*/
1446 /* Extract identifier from cnf. */
1447 auto &cnf = M.filter.filter();
1448 Schema designators = cnf.get_required();
1449 M_insist(designators.num_entries() == 1, "filter condition must contain exactly one designator");
1450 Schema::Identifier &id = designators[0].id;
1451
1452 /* Add sortedness post condition. */
1453 Sortedness::order_t orders;
1454 orders.add(id, Sortedness::O_ASC);
1455 post_cond.add_condition(Sortedness(std::move(orders)));
1456
1457 return post_cond;
1458}
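/* Example of why this matters: for an index on `x`, the advertised `Sortedness(x ASC)` lets the
 * physical optimizer satisfy a downstream `ORDER BY x` with the `NoOp` sorting implementation,
 * avoiding an explicit sort of the index scan's output. */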
1459
1460 template<idx::IndexMethod IndexMethod>
1461 double IndexScan<IndexMethod>::cost(const Match<IndexScan<IndexMethod>>&)
1462 {
1463 /* TODO: add meaningful cost function. */
1464 return 0.0;
1465}
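/* Sketch of a possible refinement (not implemented): charge the two logarithmic bound lookups plus
 * a term proportional to the selectivity of the range; with the current constant 0.0, an index
 * scan is always preferred once its pre-condition holds. */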
1466
1467template<idx::IndexMethod IndexMethod, typename Index, sql_type SqlT>
1468void index_scan_codegen_compilation(const Index &index, const index_scan_bounds_t &bounds,
1469 const Match<IndexScan<IndexMethod>> &M,
1470 setup_t setup, pipeline_t pipeline, teardown_t teardown) {
1471 using key_type = Index::key_type;
1472 using sql_type = SqlT;
1473
1474 if (options::index_scan_compilation_strategy == option_configs::IndexScanCompilationStrategy::CALLBACK) {
1475 /*----- Resolve callback function names. -----*/
1476 const char *scan_fn, *lower_bound_fn, *upper_bound_fn;
1477#define SET_CALLBACK_FNS(INDEX, KEY) \
1478 scan_fn = M_STR(idx_scan_##INDEX##_##KEY); \
1479 lower_bound_fn = M_STR(idx_lower_bound_##INDEX##_##KEY); \
1480 upper_bound_fn = M_STR(idx_upper_bound_##INDEX##_##KEY)
1481
1482#define RESOLVE_KEYTYPE(INDEX) \
1483 if constexpr(std::same_as<SqlT, _Boolx1>) { \
1484 SET_CALLBACK_FNS(INDEX, b); \
1485 } else if constexpr(std::same_as<sql_type, _I8x1>) { \
1486 SET_CALLBACK_FNS(INDEX, i1); \
1487 } else if constexpr(std::same_as<sql_type, _I16x1>) { \
1488 SET_CALLBACK_FNS(INDEX, i2); \
1489 } else if constexpr(std::same_as<sql_type, _I32x1>) { \
1490 SET_CALLBACK_FNS(INDEX, i4); \
1491 } else if constexpr(std::same_as<sql_type, _I64x1>) { \
1492 SET_CALLBACK_FNS(INDEX, i8); \
1493 } else if constexpr(std::same_as<sql_type, _Floatx1>) { \
1494 SET_CALLBACK_FNS(INDEX, f); \
1495 } else if constexpr(std::same_as<sql_type, _Doublex1>) { \
1496 SET_CALLBACK_FNS(INDEX, d); \
1497 } else if constexpr(std::same_as<sql_type, NChar>) { \
1498 SET_CALLBACK_FNS(INDEX, p); \
1499 } else { \
1500 M_unreachable("incompatible SQL type"); \
1501 }
1502 if constexpr(is_specialization<Index, idx::ArrayIndex>) {
1503 RESOLVE_KEYTYPE(array)
1504 } else if constexpr(is_specialization<Index, idx::RecursiveModelIndex>) {
1505 RESOLVE_KEYTYPE(rmi)
1506 } else {
1507 M_unreachable("unknown index type");
1508 }
1509#undef RESOLVE_KEYTYPE
1510#undef SET_CALLBACK_FNS
1511
1512 /*----- Add index to context. -----*/
1513 auto &context = WasmEngine::Get_Wasm_Context_By_ID(Module::ID());
1514 U64x1 index_id(context.add_index(index));
1515
1516 /*----- Emit host calls to query the index for lo and hi bounds. -----*/
1517 auto compile_bound_lookup = [&](const ast::Expr &bound, bool is_lower_bound) {
1518 auto [constant, is_negative] = get_valid_bound(bound);
1519 auto c = Interpreter::eval(constant);
1520 key_type _key;
1521 if constexpr(m::boolean<key_type>) {
1522 _key = bool(c);
1523 M_insist(not is_negative, "boolean cannot be negative");
1524 } else if constexpr(m::integral<key_type>) {
1525 auto i64 = int64_t(c);
1526 M_insist(std::in_range<key_type>(i64), "integral constant must be in range");
1527 _key = key_type(i64);
1528 _key = is_negative ? -_key : _key;
1529 } else if constexpr(std::same_as<float, key_type>) {
1530 auto d = double(c);
1531 _key = key_type(d);
1532 M_insist(_key == d, "downcasting should not impact precision");
1533 _key = is_negative ? -_key : _key;
1534 } else if constexpr(std::same_as<double, key_type>) {
1535 _key = double(c);
1536 _key = is_negative ? -_key : _key;
1537 } else if constexpr(std::same_as<const char*, key_type>) {
1538 _key = reinterpret_cast<const char*>(c.as_p());
1539 M_insist(not is_negative, "string cannot be negative");
1540 }
1541
1542 std::optional<typename sql_type::primitive_type> key;
1543 if (options::index_scan_materialization_strategy == option_configs::IndexScanMaterializationStrategy::INLINE) {
1544 if constexpr (std::same_as<sql_type, NChar>) {
1545 key.emplace(CodeGenContext::Get().get_literal_address(_key));
1546 } else {
1547 key.emplace(_key);
1548 }
1549 } else if (options::index_scan_materialization_strategy == option_configs::IndexScanMaterializationStrategy::MEMORY) {
1550 /* If we materialize before calling the bound functions, the key parameter is independent of the bounds.
1551 * As a result, queries that only differ in the filter predicate are compiled to the exact same
1552 * WebAssembly code, enabling caching of compiled plans in V8. */
1553 if constexpr (std::same_as<sql_type, NChar>) {
1554 uint32_t *key_address = Module::Allocator().raw_malloc<uint32_t>();
1555 *key_address = CodeGenContext::Get().get_literal_raw_address(_key);
1556
1557 Ptr<U32x1> key_ptr(key_address);
1558 key.emplace(U32x1(*key_ptr).to<char*>(), false, as<const CharacterSequence>(bound.type()));
1559 } else {
1560 auto *key_address = Module::Allocator().raw_malloc<typename sql_type::type>();
1561 *key_address = _key;
1562
1563 Ptr<typename sql_type::primitive_type> key_ptr(key_address);
1564 key.emplace(*key_ptr);
1565 }
1566 } else {
1567 M_unreachable("unknown materialization strategy");
1568 }
1569 M_insist(bool(key), "key must be set");
1570 return Module::Get().emit_call<uint32_t>(
1571 /* fn= */ is_lower_bound ? lower_bound_fn : upper_bound_fn,
1572 /* index_id= */ index_id.clone(),
1573 /* key= */ *key
1574 );
1575 };
1576 Var<U32x1> lo(bool(bounds.lo) ? compile_bound_lookup(bounds.lo->get(), bounds.is_inclusive_lo)
1577 : U32x1(0));
1578 const Var<U32x1> hi(bool(bounds.hi) ? compile_bound_lookup(bounds.hi->get(), not bounds.is_inclusive_hi)
1579 : U32x1(index.num_entries()));
1580 Wasm_insist(lo <= hi, "bounds need to be valid");
1581
1582 /*----- Allocate memory for communication to host. -----*/
1583 M_insist(std::in_range<uint32_t>(M.batch_size), "should fit in uint32_t");
1584
1585 /* Determine alloc size as minimum of number of results and command-line parameter batch size, where 0 is
1586 * interpreted as infinity. */
1587 const Var<U32x1> alloc_size([&](){
1588 U32x1 num_results = hi - lo;
1589 U32x1 num_results_cpy = num_results.clone();
1590 U32x1 batch_size = M.batch_size == 0 ? num_results.clone() : U32x1(M.batch_size);
1591 U32x1 batch_size_cpy = batch_size.clone();
1592 return Select(batch_size < num_results, batch_size_cpy, num_results_cpy);
1593 }());
1594 Ptr<U32x1> buffer_address = Module::Allocator().malloc<uint32_t>(alloc_size);
1595
1596 /*----- Emit setup code *after* allocating memory to guarantee sequential memory allocation for pipeline. -----*/
1597 setup();
1598
1599 /*----- Emit loop code. -----*/
1600 Var<U32x1> num_tuples_in_batch;
1601 Var<Ptr<U32x1>> ptr;
1602 WHILE (lo < hi) {
1603 num_tuples_in_batch = Select(hi - lo > alloc_size, alloc_size, hi - lo);
1604 /* Call host to fill buffer memory with next batch of tuple ids. */
1605 Module::Get().emit_call<void>(
1606 /* fn= */ scan_fn,
1607 /* index_id= */ index_id,
1608 /* entry_offset= */ lo.val(),
1609 /* address= */ buffer_address.clone(),
1610 /* batch_size= */ num_tuples_in_batch.val()
1611 );
1612 lo += num_tuples_in_batch;
1613 ptr = buffer_address.clone();
1614 WHILE(num_tuples_in_batch > 0U) {
1615 static Schema empty_schema;
1616 compile_load_point_access(
1617 /* tuple_value_schema= */ M.scan.schema(),
1618 /* tuple_address_schema= */ empty_schema,
1619 /* base_address= */ get_base_address(M.scan.store().table().name()),
1620 /* layout= */ M.scan.store().table().layout(),
1621 /* layout_schema= */ M.scan.store().table().schema(M.scan.alias()),
1622 /* tuple_id= */ *ptr
1623 );
1624 pipeline();
1625 num_tuples_in_batch -= 1U;
1626 ptr += 1;
1627 }
1628 }
1629
1630 /*----- Emit teardown code. -----*/
1631 teardown();
1632
1633 /*----- Free buffer memory. -----*/
1634 IF (alloc_size > U32x1(0)) { // only free if actually allocated
1635 Module::Allocator().free(buffer_address, alloc_size);
1636 };
1637 } else if (options::index_scan_compilation_strategy == option_configs::IndexScanCompilationStrategy::EXPOSED_MEMORY) {
1638 M_unreachable("not implemented yet");
1639 } else {
1640 M_unreachable("unknown compilation strategy");
1641 }
1642}
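/* Worked example of the batching protocol above, assuming `hi - lo == 10` matching entries and
 * `M.batch_size == 4`: `alloc_size = min(10, 4) = 4`, so the outer WHILE issues three host calls
 * that deliver 4, 4, and 2 tuple ids into the buffer, and the inner WHILE resumes the pipeline
 * once per delivered id. A batch size of 0 degenerates to a single call for all 10 ids. */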
1643
1644template<idx::IndexMethod IndexMethod, typename Index>
1645void index_scan_codegen_interpretation(const Index &index, const index_scan_bounds_t &bounds,
1646 const Match<IndexScan<IndexMethod>> &M,
1647 setup_t setup, pipeline_t pipeline, teardown_t teardown)
1648{
1649 using key_type = Index::key_type;
1650
1651 static Schema empty_schema;
1652
1653 /*----- Interpret lo and hi bounds to retrieve index scan range -----*/
1654 auto interpret_and_lookup_bound = [&](const ast::Expr &bound, bool is_lower_bound) -> std::size_t {
1655 auto [constant, is_negative] = get_valid_bound(bound);
1656 auto c = Interpreter::eval(constant);
1657 key_type key;
1658 if constexpr(m::boolean<key_type>) {
1659 key = bool(c);
1660 M_insist(not is_negative, "boolean cannot be negative");
1661 } else if constexpr(m::integral<key_type>) {
1662 auto i64 = int64_t(c);
1663 M_insist(std::in_range<key_type>(i64), "integral constant must be in range");
1664 key = key_type(i64);
1665 key = is_negative ? -key : key;
1666 } else if constexpr(std::same_as<float, key_type>) {
1667 auto d = double(c);
1668 key = key_type(d);
1669 M_insist(key == d, "downcasting should not impact precision");
1670 key = is_negative ? -key : key;
1671 } else if constexpr(std::same_as<double, key_type>) {
1672 key = double(c);
1673 key = is_negative ? -key : key;
1674 } else if constexpr(std::same_as<const char*, key_type>) {
1675 key = reinterpret_cast<const char*>(c.as_p());
1676 M_insist(not is_negative, "string cannot be negative");
1677 }
1678 return std::distance(index.begin(), is_lower_bound ? index.lower_bound(key)
1679 : index.upper_bound(key));
1680 };
1681 std::size_t lo = bool(bounds.lo) ? interpret_and_lookup_bound(bounds.lo->get(), bounds.is_inclusive_lo)
1682 : 0UL;
1683 std::size_t hi = bool(bounds.hi) ? interpret_and_lookup_bound(bounds.hi->get(), not bounds.is_inclusive_hi)
1684 : index.num_entries();
1685 M_insist(lo <= hi, "bounds need to be valid");
1686
1687 if (options::index_scan_materialization_strategy == option_configs::IndexScanMaterializationStrategy::MEMORY) {
1688 /*----- Allocate sufficient memory for results. -----*/
1689 uint32_t num_results = hi - lo;
1690 uint32_t *buffer_address = Module::Allocator().raw_malloc<uint32_t>(num_results + 1); // +1 for storing number of results itself
1691
1692 /*----- Perform index scan and fill memory with number of results and results. -----*/
1693 uint32_t *buffer_ptr = buffer_address;
1694 *buffer_ptr = num_results; // store in memory to enable caching
1695 ++buffer_ptr;
1696 for (auto it = index.begin() + lo; it != index.begin() + hi; ++it) {
1697 M_insist(std::in_range<uint32_t>(it->second), "tuple id must fit in uint32_t");
1698 *buffer_ptr = it->second;
1699 ++buffer_ptr;
1700 }
1701
1702 /*----- Emit setup code *after* allocating memory to guarantee sequential memory allocation for pipeline. -----*/
1703 setup();
1704
1705 /*----- Emit loop code. -----*/
1706 Ptr<U32x1> base(buffer_address + 1); // +1 to skip stored number of results
1707 Var<Ptr<U32x1>> ptr(base.clone());
1708 const Var<Ptr<U32x1>> end(base + U32x1(*Ptr<U32x1>(buffer_address)).make_signed());
1709 WHILE(ptr < end) {
1710 compile_load_point_access(
1711 /* tuple_value_schema= */ M.scan.schema(),
1712 /* tuple_address_schema= */ empty_schema,
1713 /* base_address= */ get_base_address(M.scan.store().table().name()),
1714 /* layout= */ M.scan.store().table().layout(),
1715 /* layout_schema= */ M.scan.store().table().schema(M.scan.alias()),
1716 /* tuple_id= */ *ptr
1717 );
1718 pipeline();
1719 ptr += 1;
1720 }
1721
1722 /*----- Emit teardown code. -----*/
1723 teardown();
1724 } else if (options::index_scan_materialization_strategy == option_configs::IndexScanMaterializationStrategy::INLINE) {
1725 /*----- Define function that emits code for loading and executing pipeline for a single tuple. -----*/
1726 FUNCTION(index_scan_parent_pipeline, void(uint32_t))
1727 {
1728 auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function
1729
1730 /*----- Emit setup code. -----*/
1731 setup();
1732
1733 /*----- Load tuple. -----*/
1734 compile_load_point_access(
1735 /* tuple_value_schema= */ M.scan.schema(),
1736 /* tuple_address_schema= */ empty_schema,
1737 /* base_address= */ get_base_address(M.scan.store().table().name()),
1738 /* layout= */ M.scan.store().table().layout(),
1739 /* layout_schema= */ M.scan.store().table().schema(M.scan.alias()),
1740 /* tuple_id= */ PARAMETER(0)
1741 );
1742
1743 /*----- Emit pipeline code. -----*/
1744 pipeline();
1745
1746 /*----- Emit teardown code. -----*/
1747 teardown();
1748 }
1749
1750 /*----- Perform index sequential scan, emit code to execute pipeline for each tuple. -----*/
1751 for (auto it = index.begin() + lo; it != index.begin() + hi; ++it) {
1752 M_insist(std::in_range<uint32_t>(it->second), "tuple id must fit in uint32_t");
1753 index_scan_parent_pipeline(uint32_t(it->second));
1754 }
1755 } else {
1756 M_unreachable("unknown materialization strategy");
1757 }
1758}
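/* Illustration of the buffer layout written above, e.g. for matching tuple ids {7, 9, 12}:
 *   buffer_address[0] = 3 (number of results), buffer_address[1..3] = 7, 9, 12.
 * Because the emitted loop reads the result count from memory rather than embedding it as a
 * constant, the generated Wasm code stays identical across queries with different bounds. */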
1759
1760template<idx::IndexMethod IndexMethod, typename Index, sql_type SqlT>
1761void index_scan_codegen_hybrid(const Index &index, const index_scan_bounds_t &bounds,
1762 const Match<IndexScan<IndexMethod>> &M,
1763 setup_t setup, pipeline_t pipeline, teardown_t teardown)
1764{
1765 using key_type = Index::key_type;
1766 using sql_type = SqlT;
1767
1768 /*----- Resolve callback function name. -----*/
1769 const char *scan_fn;
1770#define SET_CALLBACK_FNS(INDEX, KEY) \
1771 scan_fn = M_STR(idx_scan_##INDEX##_##KEY)
1772
1773#define RESOLVE_KEYTYPE(INDEX) \
1774 if constexpr(std::same_as<SqlT, _Boolx1>) { \
1775 SET_CALLBACK_FNS(INDEX, b); \
1776 } else if constexpr(std::same_as<sql_type, _I8x1>) { \
1777 SET_CALLBACK_FNS(INDEX, i1); \
1778 } else if constexpr(std::same_as<sql_type, _I16x1>) { \
1779 SET_CALLBACK_FNS(INDEX, i2); \
1780 } else if constexpr(std::same_as<sql_type, _I32x1>) { \
1781 SET_CALLBACK_FNS(INDEX, i4); \
1782 } else if constexpr(std::same_as<sql_type, _I64x1>) { \
1783 SET_CALLBACK_FNS(INDEX, i8); \
1784 } else if constexpr(std::same_as<sql_type, _Floatx1>) { \
1785 SET_CALLBACK_FNS(INDEX, f); \
1786 } else if constexpr(std::same_as<sql_type, _Doublex1>) { \
1787 SET_CALLBACK_FNS(INDEX, d); \
1788 } else if constexpr(std::same_as<sql_type, NChar>) { \
1789 SET_CALLBACK_FNS(INDEX, p); \
1790 } else { \
1791 M_unreachable("incompatible SQL type"); \
1792 }
1793 if constexpr(is_specialization<Index, idx::ArrayIndex>) {
1794 RESOLVE_KEYTYPE(array)
1795 } else if constexpr(is_specialization<Index, idx::RecursiveModelIndex>) {
1796 RESOLVE_KEYTYPE(rmi)
1797 } else {
1798 M_unreachable("unknown index type");
1799 }
1800#undef RESOLVE_KEYTYPE
1801#undef SET_CALLBACK_FNS
1802
1803 /*----- Add index to context. -----*/
1804 auto &context = WasmEngine::Get_Wasm_Context_By_ID(Module::ID());
1805 U64x1 index_id(context.add_index(index));
1806
1807 /*----- Interpret lo and hi bounds to retrieve index scan range -----*/
1808 auto interpret_and_lookup_bound = [&](const ast::Expr &bound, bool is_lower_bound) -> std::size_t {
1809 auto [constant, is_negative] = get_valid_bound(bound);
1810 auto c = Interpreter::eval(constant);
1811 key_type key;
1812 if constexpr(m::boolean<key_type>) {
1813 key = bool(c);
1814 M_insist(not is_negative, "boolean cannot be negative");
1815 } else if constexpr(m::integral<key_type>) {
1816 auto i64 = int64_t(c);
1817 M_insist(std::in_range<key_type>(i64), "integral constant must be in range");
1818 key = key_type(i64);
1819 key = is_negative ? -key : key;
1820 } else if constexpr(std::same_as<float, key_type>) {
1821 auto d = double(c);
1822 key = key_type(d);
1823 M_insist(key == d, "downcasting should not impact precision");
1824 key = is_negative ? -key : key;
1825 } else if constexpr(std::same_as<double, key_type>) {
1826 key = double(c);
1827 key = is_negative ? -key : key;
1828 } else if constexpr(std::same_as<const char*, key_type>) {
1829 key = reinterpret_cast<const char*>(c.as_p());
1830 M_insist(not is_negative, "string cannot be negative");
1831 }
1832 return std::distance(index.begin(), is_lower_bound ? index.lower_bound(key)
1833 : index.upper_bound(key));
1834 };
1835 std::size_t lo = bool(bounds.lo) ? interpret_and_lookup_bound(bounds.lo->get(), bounds.is_inclusive_lo)
1836 : 0UL;
1837 std::size_t hi = bool(bounds.hi) ? interpret_and_lookup_bound(bounds.hi->get(), not bounds.is_inclusive_hi)
1838 : index.num_entries();
1839 M_insist(lo <= hi, "bounds need to be valid");
1840 M_insist(std::in_range<uint32_t>(lo), "should fit in uint32_t");
1841 M_insist(std::in_range<uint32_t>(hi), "should fit in uint32_t");
1842
1843 /*----- Materialize offsets hi and lo. -----*/
1844 Var<U32x1> begin;
1845 std::optional<U32x1> end;
1846 if (options::index_scan_materialization_strategy == option_configs::IndexScanMaterializationStrategy::INLINE) {
1847 begin = U32x1(lo);
1848 end.emplace(hi);
1849 } else if (options::index_scan_materialization_strategy == option_configs::IndexScanMaterializationStrategy::MEMORY) {
1850 /* If we materialize before allocating buffer memory, the addresses are independent of the buffer size. As a
1851 * result, queries that only differ in the filter predicate are compiled to the exact same WebAssembly code,
1852 * enabling caching of compiled plans in V8. */
1853 uint32_t *offset_address = Module::Allocator().raw_malloc<uint32_t>(2);
1854 offset_address[0] = uint32_t(lo);
1855 offset_address[1] = uint32_t(hi);
1856
1857 Ptr<U32x1> offset_ptr(offset_address);
1858 begin = *offset_ptr.clone();
1859 end.emplace(*(offset_ptr + 1));
1860 } else {
1861 M_unreachable("unknown materialization strategy");
1862 }
1863 M_insist(bool(end), "end must be set");
1864
1866 /*----- Allocate buffer memory for communication to host. -----*/
1867 M_insist(std::in_range<uint32_t>(M.batch_size), "should fit in uint32_t");
1868
1869 /* Determine alloc size as minimum of number of results and command-line parameter batch size, where 0 is
1870 * interpreted as infinity. */
1871 const Var<U32x1> alloc_size([&](){
1872 U32x1 num_results = end->clone() - begin;
1873 U32x1 num_results_cpy = num_results.clone();
1874 U32x1 batch_size = M.batch_size == 0 ? num_results.clone() : U32x1(M.batch_size);
1875 U32x1 batch_size_cpy = batch_size.clone();
1876 return Select(batch_size < num_results, batch_size_cpy, num_results_cpy);
1877 }());
1878 Ptr<U32x1> buffer_address = Module::Allocator().malloc<uint32_t>(alloc_size);
1879
1880 /*----- Emit setup code *after* allocating memory to guarantee sequential memory allocation for pipeline. -----*/
1881 setup();
1882
1883 /*----- Emit loop code. -----*/
1884 Var<U32x1> num_tuples_in_batch;
1885 Var<Ptr<U32x1>> ptr;
1886 WHILE (begin < end->clone()) {
1887 auto end_cpy = end->clone();
1888 num_tuples_in_batch = Select(*end - begin > alloc_size, alloc_size, end_cpy - begin);
1889 /* Call host to fill buffer memory with next batch of tuple ids. */
1890 Module::Get().emit_call<void>(
1891 /* fn= */ scan_fn,
1892 /* index_id= */ index_id,
1893 /* entry_offset= */ begin.val(),
1894 /* address= */ buffer_address.clone(),
1895 /* batch_size= */ num_tuples_in_batch.val()
1896 );
1897 begin += num_tuples_in_batch;
1898 ptr = buffer_address.clone();
1899 WHILE(num_tuples_in_batch > 0U) {
1900 static Schema empty_schema;
1901 compile_load_point_access(
1902 /* tuple_value_schema= */ M.scan.schema(),
1903 /* tuple_address_schema= */ empty_schema,
1904 /* base_address= */ get_base_address(M.scan.store().table().name()),
1905 /* layout= */ M.scan.store().table().layout(),
1906 /* layout_schema= */ M.scan.store().table().schema(M.scan.alias()),
1907 /* tuple_id= */ *ptr
1908 );
1909 pipeline();
1910 num_tuples_in_batch -= 1U;
1911 ptr += 1;
1912 }
1913 }
1914
1915 /*----- Emit teardown code. -----*/
1916 teardown();
1917
1918 /*----- Free buffer memory. -----*/
1919 IF (alloc_size > U32x1(0)) { // only free if actually allocated
1920 Module::Allocator().free(buffer_address, alloc_size);
1921 };
1922 } else if (options::index_scan_compilation_strategy == option_configs::IndexScanCompilationStrategy::EXPOSED_MEMORY) {
1923 M_unreachable("not implemented yet");
1924 } else {
1925 M_unreachable("unknown compilation strategy");
1926 }
1927}
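/* Recap of the three code generation strategies implemented above: compilation resolves the bounds
 * at query runtime via host calls and fetches tuple ids in batches; interpretation resolves the
 * bounds *and* all matching tuple ids at compile time and materializes them; hybrid interprets only
 * the bounds at compile time and still fetches tuple ids in batches at runtime. */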
1928
1930template<idx::IndexMethod IndexMethod, typename Index, sql_type SqlT>
1931void index_scan_resolve_strategy(const Index &index, const index_scan_bounds_t &bounds, const Match<IndexScan<IndexMethod>> &M, setup_t setup, pipeline_t pipeline, teardown_t teardown)
1932{
1934 index_scan_codegen_compilation<IndexMethod, Index, SqlT>(index, bounds, M, std::move(setup), std::move(pipeline), std::move(teardown));
1936 index_scan_codegen_interpretation<IndexMethod, Index>(index, bounds, M, std::move(setup), std::move(pipeline), std::move(teardown));
1938 index_scan_codegen_hybrid<IndexMethod, Index, SqlT>(index, bounds, M, std::move(setup), std::move(pipeline), std::move(teardown));
1939 } else {
1940 M_unreachable("invalid index access strategy");
1941 }
1942}
1943
1945 template<idx::IndexMethod IndexMethod, typename AttrT, sql_type SqlT>
1946 void index_scan_resolve_index_method(const index_scan_bounds_t &bounds, const Match<IndexScan<IndexMethod>> &M,
1947 setup_t setup, pipeline_t pipeline, teardown_t teardown)
1948{
1949 /*----- Lookup index. -----*/
1950 Catalog &C = Catalog::Get();
1951 auto &DB = C.get_database_in_use();
1952 auto &table_name = M.scan.store().table().name();
1953 auto &attribute_name = bounds.attribute.id.name;
1954 auto &index_base = DB.get_index(table_name, attribute_name, IndexMethod);
1955
1956 /*----- Resolve index type. -----*/
1957 if constexpr(IndexMethod == idx::IndexMethod::Array and requires { typename idx::ArrayIndex<AttrT>; }) {
1958 auto &index = as<const idx::ArrayIndex<AttrT>>(index_base);
1959 index_scan_resolve_strategy<IndexMethod, const idx::ArrayIndex<AttrT>, SqlT>(
1960 index, bounds, M, std::move(setup), std::move(pipeline), std::move(teardown)
1961 );
1962 } else if constexpr(IndexMethod == idx::IndexMethod::Rmi and requires { typename idx::RecursiveModelIndex<AttrT>; }) {
1963 auto &index = as<const idx::RecursiveModelIndex<AttrT>>(index_base);
1964 index_scan_resolve_strategy<IndexMethod, const idx::RecursiveModelIndex<AttrT>, SqlT>(
1965 index, bounds, M, std::move(setup), std::move(pipeline), std::move(teardown)
1966 );
1967 } else {
1968 M_unreachable("invalid index method");
1969 }
1970}
1971
1973 template<idx::IndexMethod IndexMethod>
1974 void index_scan_resolve_attribute_type(const Match<IndexScan<IndexMethod>> &M,
1975 setup_t setup, pipeline_t pipeline, teardown_t teardown)
1976{
1977 /*----- Extract bounds from CNF. -----*/
1978 auto &cnf = M.filter.filter();
1979 auto bounds = extract_index_scan_bounds(cnf);
1980
1981 /*----- Resolve attribute type. -----*/
1982#define RESOLVE_INDEX_METHOD(ATTRTYPE, SQLTYPE) \
1983 index_scan_resolve_index_method<IndexMethod, ATTRTYPE, SQLTYPE>(bounds, M, std::move(setup), std::move(pipeline), std::move(teardown))
1984
1985 visit(overloaded {
1986 [&](const Boolean&) { RESOLVE_INDEX_METHOD(bool, _Boolx1); },
1987 [&](const Numeric &n) {
1988 switch (n.kind) {
1989 case Numeric::N_Int:
1990 case Numeric::N_Decimal:
1991 switch (n.size()) {
1992 default: M_unreachable("invalid size");
1993 case 8: RESOLVE_INDEX_METHOD(int8_t, _I8x1); break;
1994 case 16: RESOLVE_INDEX_METHOD(int16_t, _I16x1); break;
1995 case 32: RESOLVE_INDEX_METHOD(int32_t, _I32x1); break;
1996 case 64: RESOLVE_INDEX_METHOD(int64_t, _I64x1); break;
1997 }
1998 break;
1999 case Numeric::N_Float:
2000 switch (n.size()) {
2001 default: M_unreachable("invalid size");
2002 case 32: RESOLVE_INDEX_METHOD(float, _Floatx1); break;
2003 case 64: RESOLVE_INDEX_METHOD(double, _Doublex1); break;
2004 }
2005 break;
2006 }
2007 },
2008 [&](const CharacterSequence&) { RESOLVE_INDEX_METHOD(const char*, NChar); },
2009 [&](const Date&) { RESOLVE_INDEX_METHOD(int32_t, _I32x1); },
2010 [&](const DateTime&) { RESOLVE_INDEX_METHOD(int64_t, _I64x1); },
2011 [](auto&&) { M_unreachable("invalid type"); },
2012 }, *bounds.attribute.type);
2013
2014#undef RESOLVE_INDEX_METHOD
2015}
2016
2017 template<idx::IndexMethod IndexMethod>
2018 void IndexScan<IndexMethod>::execute(const Match<IndexScan<IndexMethod>> &M,
2019 setup_t setup, pipeline_t pipeline, teardown_t teardown)
2020{
2021 auto &schema = M.scan.schema();
2022 M_insist(schema == schema.drop_constants().deduplicate(), "Schema of `ScanOperator` must neither contain NULL nor duplicates");
2023
2024 auto &table = M.scan.store().table();
2025 M_insist(not table.layout().is_finite(), "layout for `wasm::IndexScan` must be infinite");
2026
2033 index_scan_resolve_attribute_type(M, std::move(setup), std::move(pipeline), std::move(teardown));
2034}
2035
2036
2037/*======================================================================================================================
2038 * Filter
2039 *====================================================================================================================*/
2040
2041template<bool Predicated>
2042ConditionSet Filter<Predicated>::pre_condition(std::size_t child_idx, const std::tuple<const FilterOperator*>&)
2043{
2044 M_insist(child_idx == 0);
2045
2046 ConditionSet pre_cond;
2047
2048 if constexpr (not Predicated) {
2049 /*----- Branching filter does not support SIMD. -----*/
2050 pre_cond.add_condition(NoSIMD());
2051 }
2052
2053 return pre_cond;
2054}
2055
2056 template<bool Predicated>
2057 ConditionSet Filter<Predicated>::adapt_post_condition(const Match<Filter<Predicated>>&, const ConditionSet &post_cond_child)
2058 {
2059 ConditionSet post_cond(post_cond_child);
2060
2061 if constexpr (Predicated) {
2062 /*----- Predicated filter introduces predication. -----*/
2063 post_cond.add_or_replace_condition(m::Predicated(true));
2064 }
2065
2066 return post_cond;
2067}
2068
2069 template<bool Predicated>
2070 double Filter<Predicated>::cost(const Match<Filter<Predicated>> &M)
2071 {
2072 const cnf::CNF &cond = M.filter.filter();
2073 const unsigned cost = std::accumulate(cond.cbegin(), cond.cend(), 0U, [](unsigned cost, const cnf::Clause &clause) {
2074 return cost + clause.size();
2075 });
2076 return cost;
2077}
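/* Worked example: for the CNF `(a OR b) AND c` the clause sizes are 2 and 1, so the estimated cost
 * is 3, i.e. one unit per predicate that may have to be evaluated. */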
2078
2079 template<bool Predicated>
2080 void Filter<Predicated>::execute(const Match<Filter<Predicated>> &M, setup_t setup, pipeline_t pipeline, teardown_t teardown)
2081 {
2082 /*----- Set minimal number of SIMD lanes preferred to get fully utilized SIMD vectors for the filter condition. --*/
2083 CodeGenContext::Get().update_num_simd_lanes_preferred(16); // set own preference
2084
2085 /*----- Execute filter. -----*/
2086 M.child->execute(
2087 /* setup= */ std::move(setup),
2088 /* pipeline= */ [&, pipeline=std::move(pipeline)](){
2089 if constexpr (Predicated) {
2090 CodeGenContext::Get().env().add_predicate(M.filter.filter());
2091 pipeline();
2092 } else {
2093 M_insist(CodeGenContext::Get().num_simd_lanes() == 1, "invalid number of SIMD lanes");
2094 IF (CodeGenContext::Get().env().compile<_Boolx1>(M.filter.filter()).is_true_and_not_null()) {
2095 pipeline();
2096 };
2097 }
2098 },
2099 /* teardown= */ std::move(teardown)
2100 );
2101}
2102
2103
2104/*======================================================================================================================
2105 * LazyDisjunctiveFilter
2106 *====================================================================================================================*/
2107
2108ConditionSet LazyDisjunctiveFilter::pre_condition(std::size_t child_idx, const std::tuple<const FilterOperator*>&)
2109{
2110 M_insist(child_idx == 0);
2111
2112 ConditionSet pre_cond;
2113
2114 /*----- Lazy disjunctive filter does not support SIMD. -----*/
2115 pre_cond.add_condition(NoSIMD());
2116
2117 return pre_cond;
2118}
2119
2121{
2122 const cnf::CNF &cond = M.filter.filter();
2123 M_insist(cond.size() == 1, "disjunctive filter condition must be a single clause");
2124 return cond[0].size() / 2.0; // on average, half the predicates in the clause are evaluated; XXX: consider selectivities
2125}
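/* Worked example: a single clause `a OR b OR c OR d` contains 4 predicates, so the estimated cost
 * is 4 / 2.0 = 2, reflecting that evaluation stops at the first satisfied predicate. */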
2126
2127 void LazyDisjunctiveFilter::execute(const Match<LazyDisjunctiveFilter> &M, setup_t setup, pipeline_t pipeline,
2128 teardown_t teardown)
2129{
2130 const cnf::Clause &clause = M.filter.filter()[0];
2131
2132 M.child->execute(
2133 /* setup= */ std::move(setup),
2134 /* pipeline= */ [&, pipeline=std::move(pipeline)](){
2135 M_insist(CodeGenContext::Get().num_simd_lanes() == 1, "invalid number of SIMD lanes");
2136 BLOCK(lazy_disjunctive_filter)
2137 {
2138 BLOCK(lazy_disjunctive_filter_then)
2139 {
2140 for (const cnf::Predicate &pred : clause) {
2141 auto cond = CodeGenContext::Get().env().compile<_Boolx1>(*pred);
2142 if (pred.negative())
2143 GOTO(cond.is_false_and_not_null(), lazy_disjunctive_filter_then); // break to remainder of pipeline
2144 else
2145 GOTO(cond.is_true_and_not_null(), lazy_disjunctive_filter_then); // break to remainder of pipeline
2146 }
2147 GOTO(lazy_disjunctive_filter); // skip pipeline
2148 }
2149 pipeline();
2150 }
2151 },
2152 /* teardown= */ std::move(teardown)
2153 );
2154}
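/* Illustration: for the clause `x = 1 OR y = 2`, the emitted code checks `x = 1` first and jumps
 * directly to the pipeline if it is TRUE and not NULL; `y = 2` is only evaluated otherwise. If no
 * predicate fires, the final GOTO skips the pipeline for this tuple altogether. */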
2155
2156
2157/*======================================================================================================================
2158 * Projection
2159 *====================================================================================================================*/
2160
2161 ConditionSet Projection::pre_condition(
2162 std::size_t child_idx,
2163 const std::tuple<const ProjectionOperator*> &partial_inner_nodes)
2164{
2165 M_insist(child_idx == 0);
2166
2167 ConditionSet pre_cond;
2168
2169 auto &projection = *std::get<0>(partial_inner_nodes);
2170
2171 if (not projection.children().empty()) { // projections starting a pipeline produce only a single tuple, i.e. no SIMD
2172 /*----- Projection does only support SIMD if all expressions can be computed using SIMD instructions. -----*/
2173 auto is_simd_computable = [](const ast::Expr &e){
2174 bool simd_computable = true;
2175 visit(overloaded {
2176 [&](const ast::BinaryExpr &b) -> void {
2177 if (b.lhs->type()->is_character_sequence() or b.rhs->type()->is_character_sequence()) {
2178 simd_computable = false; // string operations are not SIMDfiable
2179 throw visit_stop_recursion(); // abort recursion
2180 }
2181 if (b.common_operand_type->is_integral() and b.op().type == TK_SLASH) {
2182 simd_computable = false; // integer division is not SIMDfiable
2183 throw visit_stop_recursion(); // abort recursion
2184 }
2185 if (b.op().type == TK_PERCENT) {
2186 simd_computable = false; // modulo is not SIMDfiable
2187 throw visit_stop_recursion(); // abort recursion
2188 }
2189 },
2190 [](auto&) -> void {
2191 /* designators, constants, unary expressions, NULL(), INT(), already computed aggregates and results
2192 * of a nested query are SIMDfiable; nothing to be done */
2193 },
2195 return simd_computable;
2196 };
2197 auto pred = [&](auto &p){ return not is_simd_computable(p.first); };
2198 if (std::any_of(projection.projections().cbegin(), projection.projections().cend(), pred))
2199 pre_cond.add_condition(NoSIMD());
2200 }
2201
2202 return pre_cond;
2203}
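/* Illustration: `SELECT a + b, 2 * a` is SIMD-computable, whereas modulo (`a % b`), integer
 * division (`a / b` on integral operands), and any operation on character sequences cause the
 * `NoSIMD` pre-condition to be added. */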
2204
2206{
2207 ConditionSet post_cond(post_cond_child);
2208
2209 /*----- Project and rename in duplicated post condition. -----*/
2210 M_insist(M.projection.projections().size() == M.projection.schema().num_entries(),
2211 "projections must match the operator's schema");
2212 std::vector<std::pair<Schema::Identifier, Schema::Identifier>> old2new;
2213 auto p = M.projection.projections().begin();
2214 for (auto &e: M.projection.schema()) {
2215 auto pred = [&e](const auto &p) { return p.second == e.id; };
2216 if (std::find_if(old2new.cbegin(), old2new.cend(), pred) == old2new.cend()) {
2217 M_insist(p != M.projection.projections().end());
2218 old2new.emplace_back(Schema::Identifier(p->first.get()), e.id);
2219 }
2220 ++p;
2221 }
2222 post_cond.project_and_rename(old2new);
2223
2224 if (not M.child) {
2225 /*----- Leaf projection does not introduce predication. -----*/
2226 post_cond.add_condition(Predicated(false));
2227
2228 /*----- Leaf projection does not introduce SIMD. -----*/
2229 post_cond.add_condition(NoSIMD());
2230 }
2231
2232 return post_cond;
2233}
2234
2235void Projection::execute(const Match<Projection> &M, setup_t setup, pipeline_t pipeline, teardown_t teardown)
2236{
2237 auto execute_projection = [&, pipeline=std::move(pipeline)](){
2238 auto &old_env = CodeGenContext::Get().env();
2239 Environment new_env; // fresh environment
2240
2241 /*----- If predication is used, move predicate to newly created environment. -----*/
2242 if (old_env.predicated())
2243 new_env.add_predicate(old_env.extract_predicate());
2244
2245 /*----- Add projections to newly created environment. -----*/
2246 M_insist(M.projection.projections().size() == M.projection.schema().num_entries(),
2247 "projections must match the operator's schema");
2248 auto p = M.projection.projections().begin();
2249 for (auto &e: M.projection.schema()) {
2250 if (not new_env.has(e.id) and not e.id.is_constant()) { // no duplicate and no constant
2251 if (old_env.has(e.id)) {
2252 /*----- Migrate compiled expression to new context. ------*/
2253 new_env.add(e.id, old_env.get(e.id)); // to retain `e.id` for later compilation of expressions
2254 } else {
2255 /*----- Compile expression. -----*/
2256 M_insist(p != M.projection.projections().end());
2257 std::visit(overloaded {
2258 [&]<typename T, std::size_t L>(Expr<T, L> value) -> void {
2259 if (value.can_be_null()) {
2260 Var<Expr<T, L>> var(value); // introduce variable s.t. uses only load from it
2261 new_env.add(e.id, var);
2262 } else {
2263 /* introduce variable w/o NULL bit s.t. uses only load from it */
2264 Var<PrimitiveExpr<T, L>> var(value.insist_not_null());
2265 new_env.add(e.id, Expr<T, L>(var));
2266 }
2267 },
2268 [&](NChar value) -> void {
2269 Var<Ptr<Charx1>> var(value.val()); // introduce variable s.t. uses only load from it
2270 new_env.add(e.id, NChar(var, value.can_be_null(), value.length(),
2271 value.guarantees_terminating_nul()));
2272 },
2273 [](std::monostate) -> void { M_unreachable("invalid expression"); },
2274 }, old_env.compile(p->first));
2275 }
2276 }
2277 ++p;
2278 }
2279
2280 /*----- Resume pipeline with newly created environment. -----*/
2281 {
2282 auto S = CodeGenContext::Get().scoped_environment(std::move(new_env));
2283 pipeline();
2284 }
2285 };
2286
2287 if (M.child) {
2288 /*----- Set minimal number of SIMD lanes preferred to get fully utilized SIMD vectors *after* the projection. */
2289 uint64_t min_size_in_bytes = 16;
2290 for (auto &p : M.projection.projections()) {
2291 visit(overloaded {
2292 [](const m::ast::ErrorExpr&) -> void { M_unreachable("no errors at this stage"); },
2293 [](const m::ast::Designator&) -> void { /* nothing to be done */ },
2294 [](const m::ast::Constant&) -> void { /* nothing to be done */ },
2295 [](const m::ast::QueryExpr&) -> void { /* nothing to be done */ },
2296 [&min_size_in_bytes](const m::ast::FnApplicationExpr &fn) -> void {
2297 if (fn.get_function().is_aggregate())
2298 throw visit_skip_subtree(); // skip arguments to already computed aggregate
2299 min_size_in_bytes = std::min(min_size_in_bytes, (fn.type()->size() + 7) / 8);
2300 if (min_size_in_bytes == 1)
2301 throw visit_stop_recursion(); // abort recursion
2302 },
2303 [&min_size_in_bytes](auto &e) -> void { // i.e. for unary and binary expressions
2304 min_size_in_bytes = std::min(min_size_in_bytes, (e.type()->size() + 7) / 8);
2305 if (min_size_in_bytes == 1)
2306 throw visit_stop_recursion(); // abort recursion
2307 }
2308 }, p.first.get(), m::tag<m::ast::ConstPreOrderExprVisitor>());
2309 }
2310 CodeGenContext::Get().update_num_simd_lanes_preferred(16 / min_size_in_bytes); // set own preference
2311
2312 /*----- Execute projection. -----*/
2313 M.child->get()->execute(std::move(setup), std::move(execute_projection), std::move(teardown));
2314 } else {
2315 /*----- Execute projection. -----*/
2316 setup();
2317 CodeGenContext::Get().set_num_simd_lanes(1); // since only a single tuple is produced
2318 execute_projection();
2319 teardown();
2320 }
2321}
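/* Worked example for the lane preference above: if the narrowest projected type occupies 4 bytes
 * (e.g. INT(4)), then `min_size_in_bytes == 4` and 16 / 4 = 4 SIMD lanes are preferred; a 1-byte
 * type drives the preference up to the maximum of 16 lanes. */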
2322
2323
2324/*======================================================================================================================
2325 * Grouping
2326 *====================================================================================================================*/
2327
2328ConditionSet HashBasedGrouping::pre_condition(std::size_t child_idx, const std::tuple<const GroupingOperator*>&)
2329{
2330 M_insist(child_idx == 0);
2331
2332 ConditionSet pre_cond;
2333
2334 /*----- Hash-based grouping does not support SIMD. -----*/
2335 pre_cond.add_condition(NoSIMD());
2336
2337 return pre_cond;
2338}
2339
2341{
2342 return 1.5 * M.child->get_matched_root().info().estimated_cardinality;
2343}
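/* Note: the factor 1.5 versus OrderedGrouping's 1.0 (below) biases the physical optimizer towards
 * ordered grouping whenever its sortedness pre-condition is already satisfied by the child. */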
2344
2346{
2347 ConditionSet post_cond;
2348
2349 /*----- Hash-based grouping does not introduce predication (it is already handled by the hash table). -----*/
2350 post_cond.add_condition(Predicated(false));
2351
2352 /*----- Hash-based grouping does not introduce SIMD. -----*/
2353 post_cond.add_condition(NoSIMD());
2354
2355 return post_cond;
2356}
2357
2358 void HashBasedGrouping::execute(const Match<HashBasedGrouping> &M, setup_t setup, pipeline_t pipeline,
2359 teardown_t teardown)
2360{
2361 // TODO: determine setup
2362 const uint64_t AGGREGATES_SIZE_THRESHOLD_IN_BITS =
2363 M.use_in_place_values ? std::numeric_limits<uint64_t>::max() : 0;
2364
2365 const auto num_keys = M.grouping.group_by().size();
2366
2367 /*----- Compute hash table schema and information about aggregates, especially AVG aggregates. -----*/
2368 Schema ht_schema;
2369 /* Add key(s). */
2370 for (std::size_t i = 0; i < num_keys; ++i) {
2371 auto &e = M.grouping.schema()[i];
2372 ht_schema.add(e.id, e.type, e.constraints);
2373 }
2374 /* Add payload. */
2375 auto p = compute_aggregate_info(M.grouping.aggregates(), M.grouping.schema(), num_keys);
2376 const auto &aggregates = p.first;
2377 const auto &avg_aggregates = p.second;
2378 uint64_t aggregates_size_in_bits = 0;
2379 for (auto &info : aggregates) {
2380 ht_schema.add(info.entry);
2381 aggregates_size_in_bits += info.entry.type->size();
2382 }
2383
2384 /*----- Compute initial capacity of hash table. -----*/
2385 uint32_t initial_capacity = compute_initial_ht_capacity(M.grouping, M.load_factor);
2386
2387 /*----- Create hash table. -----*/
2388 std::unique_ptr<HashTable> ht;
2389 std::vector<HashTable::index_t> key_indices(num_keys);
2390 std::iota(key_indices.begin(), key_indices.end(), 0);
2391 if (M.use_open_addressing_hashing) {
2392 if (aggregates_size_in_bits < AGGREGATES_SIZE_THRESHOLD_IN_BITS)
2393 ht = std::make_unique<GlobalOpenAddressingInPlaceHashTable>(ht_schema, std::move(key_indices),
2394 initial_capacity);
2395 else
2396 ht = std::make_unique<GlobalOpenAddressingOutOfPlaceHashTable>(ht_schema, std::move(key_indices),
2397 initial_capacity);
2398 if (M.use_quadratic_probing)
2399 as<OpenAddressingHashTableBase>(*ht).set_probing_strategy<QuadraticProbing>();
2400 else
2401 as<OpenAddressingHashTableBase>(*ht).set_probing_strategy<LinearProbing>();
2402 } else {
2403 ht = std::make_unique<GlobalChainedHashTable>(ht_schema, std::move(key_indices), initial_capacity);
2404 }
2405
2406 /*----- Create child function. -----*/
2407 FUNCTION(hash_based_grouping_child_pipeline, void(void)) // create function for pipeline
2408 {
2409 auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function
2410
2411 std::optional<HashTable::entry_t> dummy;
2412
2413 M.child->execute(
2414 /* setup= */ setup_t::Make_Without_Parent([&](){
2415 ht->setup();
2416 ht->set_high_watermark(M.load_factor);
2417 dummy.emplace(ht->dummy_entry()); // create dummy slot to ignore NULL values in aggregate computations
2418 }),
2419 /* pipeline= */ [&](){
2420 M_insist(bool(dummy));
2421 const auto &env = CodeGenContext::Get().env();
2422
2423 /*----- Insert key if not yet done. -----*/
2424 std::vector<SQL_t> key;
2425 for (auto &p : M.grouping.group_by())
2426 key.emplace_back(env.compile(p.first.get()));
2427 auto [entry, inserted] = ht->try_emplace(std::move(key));
2428
2429 /*----- Compute aggregates. -----*/
2430 Block init_aggs("hash_based_grouping.init_aggs", false),
2431 update_aggs("hash_based_grouping.update_aggs", false),
2432 update_avg_aggs("hash_based_grouping.update_avg_aggs", false);
2433 for (auto &info : aggregates) {
2434 bool is_min = false;
2435 switch (info.fnid) {
2436 default:
2437 M_unreachable("unsupported aggregate function");
2438 case m::Function::FN_MIN:
2439 is_min = true; // set flag and delegate to MAX case
2440 case m::Function::FN_MAX: {
2441 M_insist(info.args.size() == 1,
2442 "MIN and MAX aggregate functions expect exactly one argument");
2443 const auto &arg = *info.args[0];
2444 std::visit(overloaded {
2445 [&]<sql_type _T>(HashTable::reference_t<_T> &&r) -> void
2446 requires (not (std::same_as<_T, _Boolx1> or std::same_as<_T, NChar>)) {
2447 using type = typename _T::type;
2448 using T = PrimitiveExpr<type>;
2449
2450 auto _arg = env.compile(arg);
2451 _T _new_val = convert<_T>(_arg);
2452
2453 BLOCK_OPEN(init_aggs) {
2454 auto [val_, is_null] = _new_val.clone().split();
2455 T val(val_); // due to structured binding and lambda closure
2456 IF (is_null) {
2457 auto neutral = is_min ? T(std::numeric_limits<type>::max())
2458 : T(std::numeric_limits<type>::lowest());
2459 r.clone().set_value(neutral); // initialize with neutral element +inf or -inf
2460 if (info.entry.nullable())
2461 r.clone().set_null(); // first value is NULL
2462 } ELSE {
2463 r.clone().set_value(val); // initialize with first value
2464 if (info.entry.nullable())
2465 r.clone().set_not_null(); // first value is not NULL
2466 };
2467 }
2468 BLOCK_OPEN(update_aggs) {
2469 if (_new_val.can_be_null()) {
2471 auto [new_val_, new_val_is_null_] = _new_val.split();
2472 auto [old_min_max_, old_min_max_is_null] = _T(r.clone()).split();
2473 const Var<Boolx1> new_val_is_null(new_val_is_null_); // due to multiple uses
2474
2475 auto chosen_r = Select(new_val_is_null, dummy->extract<_T>(info.entry.id),
2476 r.clone());
2477 if constexpr (std::floating_point<type>) {
2478 chosen_r.set_value(
2479 is_min ? min(old_min_max_, new_val_) // update old min with new value
2480 : max(old_min_max_, new_val_) // update old max with new value
2481 ); // if new value is NULL, only dummy is written
2482 } else {
2483 const Var<T> new_val(new_val_),
2484 old_min_max(old_min_max_); // due to multiple uses
2485 auto cmp = is_min ? new_val < old_min_max : new_val > old_min_max;
2486#if 1
2487 chosen_r.set_value(
2488 Select(cmp,
2489 new_val, // update to new value
2490 old_min_max) // do not update
2491 ); // if new value is NULL, only dummy is written
2492#else
2493 IF (cmp) {
2494 r.set_value(new_val);
2495 };
2496#endif
2497 }
2498 r.set_null_bit(
2499 old_min_max_is_null and new_val_is_null // MIN/MAX is NULL iff all values are NULL
2500 );
2501 } else {
2502 auto new_val_ = _new_val.insist_not_null();
2503 auto old_min_max_ = _T(r.clone()).insist_not_null();
2504 if constexpr (std::floating_point<type>) {
2505 r.set_value(
2506 is_min ? min(old_min_max_, new_val_) // update old min with new value
2507 : max(old_min_max_, new_val_) // update old max with new value
2508 );
2509 } else {
2510 const Var<T> new_val(new_val_),
2511 old_min_max(old_min_max_); // due to multiple uses
2512 auto cmp = is_min ? new_val < old_min_max : new_val > old_min_max;
2513#if 1
2514 r.set_value(
2515 Select(cmp,
2516 new_val, // update to new value
2517 old_min_max) // do not update
2518 );
2519#else
2520 IF (cmp) {
2521 r.set_value(new_val);
2522 };
2523#endif
2524 }
2525 /* do not update NULL bit since it is already set to `false` */
2526 }
2527 }
2528 },
2529 []<sql_type _T>(HashTable::reference_t<_T>&&) -> void
2530 requires std::same_as<_T,_Boolx1> or std::same_as<_T, NChar> {
2531 M_unreachable("invalid type");
2532 },
2533 [](std::monostate) -> void { M_unreachable("invalid reference"); },
2534 }, entry.extract(info.entry.id));
2535 break;
2536 }
2537 case m::Function::FN_AVG: {
2538 auto it = avg_aggregates.find(info.entry.id);
2539 M_insist(it != avg_aggregates.end());
2540 const auto &avg_info = it->second;
2541 M_insist(avg_info.compute_running_avg,
2542 "AVG aggregate may only occur for running average computations");
2543 M_insist(info.args.size() == 1, "AVG aggregate function expects exactly one argument");
2544 const auto &arg = *info.args[0];
2545
2546 auto r = entry.extract<_Doublex1>(info.entry.id);
2547 auto _arg = env.compile(arg);
2548 _Doublex1 _new_val = convert<_Doublex1>(_arg);
2549
2550 BLOCK_OPEN(init_aggs) {
2551 auto [val_, is_null] = _new_val.clone().split();
2552 Doublex1 val(val_); // due to structured binding and lambda closure
2553 IF (is_null) {
2554 r.clone().set_value(Doublex1(0.0)); // initialize with neutral element 0
2555 if (info.entry.nullable())
2556 r.clone().set_null(); // first value is NULL
2557 } ELSE {
2558 r.clone().set_value(val); // initialize with first value
2559 if (info.entry.nullable())
2560 r.clone().set_not_null(); // first value is not NULL
2561 };
2562 }
2563 BLOCK_OPEN(update_avg_aggs) {
2564 /* Compute AVG as iterative mean as described in Knuth, The Art of Computer Programming
2565 * Vol 2, section 4.2.2. */
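/* Worked example of the iterative mean: for inputs 2, 4, 9 it evolves as avg = 2,
 * then 2 + (4-2)/2 = 3, then 3 + (9-3)/3 = 5, i.e. avg += (new_val - avg) / count,
 * which avoids accumulating a potentially overflowing running sum. */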
2566 if (_new_val.can_be_null()) {
2568 auto [new_val, new_val_is_null_] = _new_val.split();
2569 auto [old_avg_, old_avg_is_null] = _Doublex1(r.clone()).split();
2570 const Var<Boolx1> new_val_is_null(new_val_is_null_); // due to multiple uses
2571 const Var<Doublex1> old_avg(old_avg_); // due to multiple uses
2572
2573 auto delta_absolute = new_val - old_avg;
2574 auto running_count = _I64x1(entry.get<_I64x1>(avg_info.running_count)).insist_not_null();
2575 auto delta_relative = delta_absolute / running_count.to<double>();
2576
2577 auto chosen_r = Select(new_val_is_null, dummy->extract<_Doublex1>(info.entry.id),
2578 r.clone());
2579 chosen_r.set_value(
2580 old_avg + delta_relative // update old average with new value
2581 ); // if new value is NULL, only dummy is written
2582 r.set_null_bit(
2583 old_avg_is_null and new_val_is_null // AVG is NULL iff all values are NULL
2584 );
2585 } else {
2586 auto new_val = _new_val.insist_not_null();
2587 auto old_avg_ = _Doublex1(r.clone()).insist_not_null();
2588 const Var<Doublex1> old_avg(old_avg_); // due to multiple uses
2589
2590 auto delta_absolute = new_val - old_avg;
2591 auto running_count = _I64x1(entry.get<_I64x1>(avg_info.running_count)).insist_not_null();
2592 auto delta_relative = delta_absolute / running_count.to<double>();
2593 r.set_value(
2594 old_avg + delta_relative // update old average with new value
2595 );
2596 /* do not update NULL bit since it is already set to `false` */
2597 }
2598 }
2599 break;
2600 }
2601 case m::Function::FN_SUM: {
2602 M_insist(info.args.size() == 1, "SUM aggregate function expects exactly one argument");
2603 const auto &arg = *info.args[0];
2604 std::visit(overloaded {
2605 [&]<sql_type _T>(HashTable::reference_t<_T> &&r) -> void
2606 requires (not (std::same_as<_T, _Boolx1> or std::same_as<_T, NChar>)) {
2607 using type = typename _T::type;
2608 using T = PrimitiveExpr<type>;
2609
2610 auto _arg = env.compile(arg);
2611 _T _new_val = convert<_T>(_arg);
2612
2613 BLOCK_OPEN(init_aggs) {
2614 auto [val_, is_null] = _new_val.clone().split();
2615 T val(val_); // due to structured binding and lambda closure
2616 IF (is_null) {
2617 r.clone().set_value(T(type(0))); // initialize with neutral element 0
2618 if (info.entry.nullable())
2619 r.clone().set_null(); // first value is NULL
2620 } ELSE {
2621 r.clone().set_value(val); // initialize with first value
2622 if (info.entry.nullable())
2623 r.clone().set_not_null(); // first value is not NULL
2624 };
2625 }
2626 BLOCK_OPEN(update_aggs) {
2627 if (_new_val.can_be_null()) {
2629 auto [new_val, new_val_is_null_] = _new_val.split();
2630 auto [old_sum, old_sum_is_null] = _T(r.clone()).split();
2631 const Var<Boolx1> new_val_is_null(new_val_is_null_); // due to multiple uses
2632
2633 auto chosen_r = Select(new_val_is_null, dummy->extract<_T>(info.entry.id),
2634 r.clone());
2635 chosen_r.set_value(
2636 old_sum + new_val // add new value to old sum
2637 ); // if new value is NULL, only dummy is written
2638 r.set_null_bit(
2639 old_sum_is_null and new_val_is_null // SUM is NULL iff all values are NULL
2640 );
2641 } else {
2642 auto new_val = _new_val.insist_not_null();
2643 auto old_sum = _T(r.clone()).insist_not_null();
2644 r.set_value(
2645 old_sum + new_val // add new value to old sum
2646 );
2647 /* do not update NULL bit since it is already set to `false` */
2648 }
2649 }
2650 },
2651 []<sql_type _T>(HashTable::reference_t<_T>&&) -> void
2652 requires std::same_as<_T,_Boolx1> or std::same_as<_T, NChar> {
2653 M_unreachable("invalid type");
2654 },
2655 [](std::monostate) -> void { M_unreachable("invalid reference"); },
2656 }, entry.extract(info.entry.id));
2657 break;
2658 }
2659 case m::Function::FN_COUNT: {
2660 M_insist(info.args.size() <= 1, "COUNT aggregate function expects at most one argument");
2661
2662 auto r = entry.get<_I64x1>(info.entry.id); // do not extract to be able to access for AVG case
2663
2664 if (info.args.empty()) {
2665 BLOCK_OPEN(init_aggs) {
2666 r.clone() = _I64x1(1); // initialize with 1 (for first value)
2667 }
2668 BLOCK_OPEN(update_aggs) {
2669 auto old_count = _I64x1(r.clone()).insist_not_null();
2670 r.set_value(
2671 old_count + int64_t(1) // increment old count by 1
2672 );
2673 /* do not update NULL bit since it is already set to `false` */
2674 }
2675 } else {
2676 const auto &arg = *info.args[0];
2677
2678 auto _arg = env.compile(arg);
2679 I64x1 new_val_not_null = not_null(_arg).to<int64_t>();
2680
2681 BLOCK_OPEN(init_aggs) {
2682 r.clone() = _I64x1(new_val_not_null.clone()); // initialize with 1 iff first value is present
2683 }
2684 BLOCK_OPEN(update_aggs) {
2685 auto old_count = _I64x1(r.clone()).insist_not_null();
2686 r.set_value(
2687 old_count + new_val_not_null // increment old count by 1 iff new value is present
2688 );
2689 /* do not update NULL bit since it is already set to `false` */
2690 }
2691 }
2692 break;
2693 }
2694 }
2695 }
2696
2697 /*----- If group has been inserted, initialize aggregates. Otherwise, update them. -----*/
2698 IF (inserted) {
2699 init_aggs.attach_to_current();
2700 } ELSE {
2701 update_aggs.attach_to_current();
2702 update_avg_aggs.attach_to_current(); // after others to ensure that running count is incremented before
2703 };
2704 },
2705 /* teardown= */ teardown_t::Make_Without_Parent([&](){ ht->teardown(); })
2706 );
2707 }
2708 hash_based_grouping_child_pipeline(); // call child function
2709
2710 auto &env = CodeGenContext::Get().env();
2711
2712 /*----- Process each computed group. -----*/
2713 setup_t(std::move(setup), [&](){ ht->setup(); })();
2714 ht->for_each([&, pipeline=std::move(pipeline)](HashTable::const_entry_t entry){
2715 /*----- Compute key schema to detect duplicated keys. -----*/
2716 Schema key_schema;
2717 for (std::size_t i = 0; i < num_keys; ++i) {
2718 auto &e = M.grouping.schema()[i];
2719 key_schema.add(e.id, e.type, e.constraints);
2720 }
2721
2722 /*----- Add computed group tuples to current environment. ----*/
2723 for (auto &e : M.grouping.schema().deduplicate()) {
2724 try {
2725 key_schema.find(e.id);
2726 } catch (invalid_argument&) {
2727 continue; // skip duplicated keys since they must not be used afterwards
2728 }
2729
2730 if (auto it = avg_aggregates.find(e.id);
2731 it != avg_aggregates.end() and not it->second.compute_running_avg)
2732 { // AVG aggregates which is not yet computed, divide computed sum with computed count
2733 auto &avg_info = it->second;
2734 auto sum = std::visit(overloaded {
2735 [&]<sql_type T>(HashTable::const_reference_t<T> &&r) -> _Doublex1
2736 requires (std::same_as<T, _I64x1> or std::same_as<T, _Doublex1>) {
2737 return T(r).template to<double>();
2738 },
2739 [](auto&&) -> _Doublex1 { M_unreachable("invalid type"); },
2740 [](std::monostate&&) -> _Doublex1 { M_unreachable("invalid reference"); },
2741 }, entry.get(avg_info.sum));
2742 auto count = _I64x1(entry.get<_I64x1>(avg_info.running_count)).insist_not_null().to<double>();
2743 auto avg = sum / count;
2744 if (avg.can_be_null()) {
2745 _Var<Doublex1> var(avg); // introduce variable s.t. uses only load from it
2746 env.add(e.id, var);
2747 } else {
2748 /* introduce variable w/o NULL bit s.t. uses only load from it */
2749 Var<Doublex1> var(avg.insist_not_null());
2750 env.add(e.id, _Doublex1(var));
2751 }
2752 } else { // part of key or already computed aggregate
2753 std::visit(overloaded {
2754 [&]<typename T>(HashTable::const_reference_t<Expr<T>> &&r) -> void {
2755 Expr<T> value = r;
2756 if (value.can_be_null()) {
2757 Var<Expr<T>> var(value); // introduce variable s.t. uses only load from it
2758 env.add(e.id, var);
2759 } else {
2760 /* introduce variable w/o NULL bit s.t. uses only load from it */
2761 Var<PrimitiveExpr<T>> var(value.insist_not_null());
2762 env.add(e.id, Expr<T>(var));
2763 }
2764 },
2765 [&](HashTable::const_reference_t<NChar> &&r) -> void {
2766 NChar value(r);
2767 Var<Ptr<Charx1>> var(value.val()); // introduce variable s.t. uses only load from it
2768 env.add(e.id, NChar(var, value.can_be_null(), value.length(),
2769 value.guarantees_terminating_nul()));
2770 },
2771 [](std::monostate&&) -> void { M_unreachable("invalid reference"); },
2772 }, entry.get(e.id)); // do not extract to be able to access for not-yet-computed AVG aggregates
2773 }
2774 }
2775
2776 /*----- Resume pipeline. -----*/
2777 pipeline();
2778 });
2779 teardown_t(std::move(teardown), [&](){ ht->teardown(); })();
2780}
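/* Illustration of the NULL handling above: for SUM(x) over the values {1, NULL, 2}, the NULL input
 * redirects its update to the dummy entry, leaving the stored sum at 1 until the value 2 arrives;
 * the aggregate's NULL bit remains set only if *all* inputs were NULL. */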
2781
2782 ConditionSet OrderedGrouping::pre_condition(
2783 std::size_t child_idx,
2784 const std::tuple<const GroupingOperator*> &partial_inner_nodes)
2785{
2786 M_insist(child_idx == 0);
2787
2788 ConditionSet pre_cond;
2789
2790 /*----- Ordered grouping needs the data sorted on the grouping key (in either order). -----*/
2791 Sortedness::order_t orders;
2792 for (auto &p : std::get<0>(partial_inner_nodes)->group_by()) {
2793 Schema::Identifier id(p.first);
2794 if (orders.find(id) == orders.cend())
2795 orders.add(std::move(id), Sortedness::O_UNDEF);
2796 }
2797 pre_cond.add_condition(Sortedness(std::move(orders)));
2798
2799 /*----- Ordered grouping does not support SIMD. -----*/
2800 pre_cond.add_condition(NoSIMD());
2801
2802 return pre_cond;
2803}
2804
2806{
2807 return 1.0 * M.child->get_matched_root().info().estimated_cardinality;
2808}
2809
2811{
2812 ConditionSet post_cond;
2813
2814 /*----- Ordered grouping does not introduce predication. -----*/
2815 post_cond.add_condition(Predicated(false));
2816
2817 /*----- Preserve order of child for grouping keys. -----*/
2818 Sortedness::order_t orders;
2819 const auto &sortedness_child = post_cond_child.get_condition<Sortedness>();
2820 for (auto &[expr, alias] : M.grouping.group_by()) {
2821 auto it = sortedness_child.orders().find(Schema::Identifier(expr));
2822 M_insist(it != sortedness_child.orders().cend());
2823 Schema::Identifier id = alias.has_value() ? Schema::Identifier(alias.assert_not_none())
2824 : Schema::Identifier(expr);
2825 if (orders.find(id) == orders.cend())
2826 orders.add(std::move(id), it->second); // drop duplicate since it must not be used afterwards
2827 }
2828 post_cond.add_condition(Sortedness(std::move(orders)));
2829
2830 /*----- Ordered grouping does not introduce SIMD. -----*/
2831 post_cond.add_condition(NoSIMD());
2832
2833 return post_cond;
2834}
2835
2837{
2838 Environment results;
2839 const auto num_keys = M.grouping.group_by().size();
2840
2841 /*----- Compute key schema to detect duplicated keys. -----*/
2842 Schema key_schema;
2843 for (std::size_t i = 0; i < num_keys; ++i) {
2844 auto &e = M.grouping.schema()[i];
2845 key_schema.add(e.id, e.type, e.constraints);
2846 }
2847
2848 /*----- Compute information about aggregates, especially about AVG aggregates. -----*/
2849 auto p = compute_aggregate_info(M.grouping.aggregates(), M.grouping.schema(), num_keys);
2850 const auto &aggregates = p.first;
2851 const auto &avg_aggregates = p.second;
2852
2853 /*----- Forward declare function to emit a group tuple in the current environment and resume the pipeline. -----*/
2854 FunctionProxy<void(void)> emit_group_and_resume_pipeline("emit_group_and_resume_pipeline");
2855
2856 std::optional<Var<Boolx1>> first_iteration;
2858 Global<Boolx1> first_iteration_backup(true);
2859
2860 using agg_t = agg_t_<false>;
2861 using agg_backup_t = agg_t_<true>;
2862 agg_t agg_values[aggregates.size()];
2863 agg_backup_t agg_value_backups[aggregates.size()];
2864
2865 using key_t = key_t_<false>;
2866 using key_backup_t = key_t_<true>;
2867 key_t key_values[num_keys];
2868 key_backup_t key_value_backups[num_keys];
2869
2870 auto store_locals_to_globals = [&](){
2871 /*----- Store local aggregate values to globals to access them in other function. -----*/
2872 for (std::size_t idx = 0; idx < aggregates.size(); ++idx) {
2873 auto &info = aggregates[idx];
2874
2875 switch (info.fnid) {
2876 default:
2877 M_unreachable("unsupported aggregate function");
2878 case m::Function::FN_MIN:
2879 case m::Function::FN_MAX: {
2880 auto min_max = [&]<typename T>() {
2881 auto &[min_max, is_null] = *M_notnull((
2882 std::get_if<std::pair<Var<PrimitiveExpr<T>>, std::optional<Var<Boolx1>>>>(&agg_values[idx])
2883 ));
2884 auto &[min_max_backup, is_null_backup] = *M_notnull((
2885 std::get_if<std::pair<Global<PrimitiveExpr<T>>,
2886 std::optional<Global<Boolx1>>>>(&agg_value_backups[idx])
2887 ));
2888 M_insist(bool(is_null) == bool(is_null_backup));
2889
2890 min_max_backup = min_max;
2891 if (is_null)
2892 *is_null_backup = *is_null;
2893 };
2894 auto &n = as<const Numeric>(*info.entry.type);
2895 switch (n.kind) {
2896 case Numeric::N_Int:
2897 case Numeric::N_Decimal:
2898 switch (n.size()) {
2899 default: M_unreachable("invalid size");
2900 case 8: min_max.template operator()<int8_t >(); break;
2901 case 16: min_max.template operator()<int16_t>(); break;
2902 case 32: min_max.template operator()<int32_t>(); break;
2903 case 64: min_max.template operator()<int64_t>(); break;
2904 }
2905 break;
2906 case Numeric::N_Float:
2907 if (n.size() <= 32)
2908 min_max.template operator()<float>();
2909 else
2910 min_max.template operator()<double>();
2911 }
2912 break;
2913 }
2914 case m::Function::FN_AVG: {
2915 auto &[avg, is_null] = *M_notnull((
2916 std::get_if<std::pair<Var<Doublex1>, std::optional<Var<Boolx1>>>>(&agg_values[idx])
2917 ));
2918 auto &[avg_backup, is_null_backup] = *M_notnull((
2919 std::get_if<std::pair<Global<Doublex1>, std::optional<Global<Boolx1>>>>(&agg_value_backups[idx])
2920 ));
2921 M_insist(bool(is_null) == bool(is_null_backup));
2922
2923 avg_backup = avg;
2924 if (is_null)
2925 *is_null_backup = *is_null;
2926
2927 break;
2928 }
2929 case m::Function::FN_SUM: {
2930 M_insist(info.args.size() == 1, "SUM aggregate function expects exactly one argument");
2931 const auto &arg = *info.args[0];
2932
2933 auto sum = [&]<typename T>() {
2934 auto &[sum, is_null] = *M_notnull((
2935 std::get_if<std::pair<Var<PrimitiveExpr<T>>, std::optional<Var<Boolx1>>>>(&agg_values[idx])
2936 ));
2937 auto &[sum_backup, is_null_backup] = *M_notnull((
2938 std::get_if<std::pair<Global<PrimitiveExpr<T>>,
2939 std::optional<Global<Boolx1>>>>(&agg_value_backups[idx])
2940 ));
2941 M_insist(bool(is_null) == bool(is_null_backup));
2942
2943 sum_backup = sum;
2944 if (is_null)
2945 *is_null_backup = *is_null;
2946 };
2947 auto &n = as<const Numeric>(*info.entry.type);
2948 switch (n.kind) {
2949 case Numeric::N_Int:
2950 case Numeric::N_Decimal:
2951 switch (n.size()) {
2952 default: M_unreachable("invalid size");
2953 case 8: sum.template operator()<int8_t >(); break;
2954 case 16: sum.template operator()<int16_t>(); break;
2955 case 32: sum.template operator()<int32_t>(); break;
2956 case 64: sum.template operator()<int64_t>(); break;
2957 }
2958 break;
2959 case Numeric::N_Float:
2960 if (n.size() <= 32)
2961 sum.template operator()<float>();
2962 else
2963 sum.template operator()<double>();
2964 }
2965 break;
2966 }
2967 case m::Function::FN_COUNT: {
2968 auto &count = *M_notnull(std::get_if<Var<I64x1>>(&agg_values[idx]));
2969 auto &count_backup = *M_notnull(std::get_if<Global<I64x1>>(&agg_value_backups[idx]));
2970
2971 count_backup = count;
2972
2973 break;
2974 }
2975 }
2976 }
2977
2978 /*----- Store local key values to globals to access them in another function. -----*/
2979 auto store = [&]<typename T>(std::size_t idx) {
2980 auto &[key, is_null] = *M_notnull((
2981 std::get_if<std::pair<Var<PrimitiveExpr<T>>, std::optional<Var<Boolx1>>>>(&key_values[idx])
2982 ));
2983 auto &[key_backup, is_null_backup] = *M_notnull((
2984 std::get_if<std::pair<Global<PrimitiveExpr<T>>, std::optional<Global<Boolx1>>>>(&key_value_backups[idx])
2985 ));
2986 M_insist(bool(is_null) == bool(is_null_backup));
2987
2988 key_backup = key;
2989 if (is_null)
2990 *is_null_backup = *is_null;
2991 };
2992 for (std::size_t idx = 0; idx < num_keys; ++idx) {
2993 visit(overloaded {
2994 [&](const Boolean&) { store.template operator()<bool>(idx); },
2995 [&](const Numeric &n) {
2996 switch (n.kind) {
2997 case Numeric::N_Int:
2998 case Numeric::N_Decimal:
2999 switch (n.size()) {
3000 default: M_unreachable("invalid size");
3001 case 8: store.template operator()<int8_t >(idx); break;
3002 case 16: store.template operator()<int16_t>(idx); break;
3003 case 32: store.template operator()<int32_t>(idx); break;
3004 case 64: store.template operator()<int64_t>(idx); break;
3005 }
3006 break;
3007 case Numeric::N_Float:
3008 if (n.size() <= 32)
3009 store.template operator()<float>(idx);
3010 else
3011 store.template operator()<double>(idx);
3012 }
3013 },
3014 [&](const CharacterSequence &cs) {
3015 auto &key = *M_notnull(std::get_if<Var<Ptr<Charx1>>>(&key_values[idx]));
3016 auto &key_backup = *M_notnull(std::get_if<Global<Ptr<Charx1>>>(&key_value_backups[idx]));
3017
3018 key_backup = key;
3019 },
3020 [&](const Date&) { store.template operator()<int32_t>(idx); },
3021 [&](const DateTime&) { store.template operator()<int64_t>(idx); },
3022 [](auto&&) { M_unreachable("invalid type"); },
3023 }, *M.grouping.schema()[idx].type);
3024 }
3025 };
3026
3027 M.child->execute(
3028 /* setup= */ setup_t::Make_Without_Parent([&](){
3029 first_iteration.emplace(first_iteration_backup);
3030
3031 /*----- Initialize aggregates and their backups. -----*/
3032 for (std::size_t idx = 0; idx < aggregates.size(); ++idx) {
3033 auto &info = aggregates[idx];
3034 const bool nullable = info.entry.nullable();
3035
3036 bool is_min = false;
3037 switch (info.fnid) {
3038 default:
3039 M_unreachable("unsupported aggregate function");
3040 case m::Function::FN_MIN:
3041 is_min = true; // set flag and delegate to MAX case
3042 case m::Function::FN_MAX: {
3043 auto min_max = [&]<typename T>() {
3044 auto neutral = is_min ? std::numeric_limits<T>::max()
3045 : std::numeric_limits<T>::lowest();
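 /* The neutral element guarantees that the first consumed value always wins the comparison: MIN starts at
  * the largest value of T, MAX at the lowest. */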
3046
3047 Var<PrimitiveExpr<T>> min_max;
3048 Global<PrimitiveExpr<T>> min_max_backup(neutral); // initialize with neutral element +inf or -inf
3049 std::optional<Var<Boolx1>> is_null;
3050 std::optional<Global<Boolx1>> is_null_backup;
3051
3052 /*----- Set local aggregate variables to global backups. -----*/
3053 min_max = min_max_backup;
3054 if (nullable) {
3055 is_null_backup.emplace(true); // MIN/MAX is initially NULL
3056 is_null.emplace(*is_null_backup);
3057 }
3058
3059 /*----- Add global aggregate to result environment to access it in another function. -----*/
3060 if (nullable)
3061 results.add(info.entry.id, Select(*is_null_backup, Expr<T>::Null(), min_max_backup));
3062 else
3063 results.add(info.entry.id, min_max_backup.val());
3064
3065 /*----- Move aggregate variables to access them later. ----*/
3066 new (&agg_values[idx]) agg_t(std::make_pair(std::move(min_max), std::move(is_null)));
3067 new (&agg_value_backups[idx]) agg_backup_t(std::make_pair(
3068 std::move(min_max_backup), std::move(is_null_backup)
3069 ));
3070 };
3071 auto &n = as<const Numeric>(*info.entry.type);
3072 switch (n.kind) {
3073 case Numeric::N_Int:
3074 case Numeric::N_Decimal:
3075 switch (n.size()) {
3076 default: M_unreachable("invalid size");
3077 case 8: min_max.template operator()<int8_t >(); break;
3078 case 16: min_max.template operator()<int16_t>(); break;
3079 case 32: min_max.template operator()<int32_t>(); break;
3080 case 64: min_max.template operator()<int64_t>(); break;
3081 }
3082 break;
3083 case Numeric::N_Float:
3084 if (n.size() <= 32)
3085 min_max.template operator()<float>();
3086 else
3087 min_max.template operator()<double>();
3088 }
3089 break;
3090 }
3091 case m::Function::FN_AVG: {
3092 Var<Doublex1> avg;
3093 Global<Doublex1> avg_backup(0.0); // initialize with neutral element 0
3094 std::optional<Var<Boolx1>> is_null;
3095 std::optional<Global<Boolx1>> is_null_backup;
3096
3097 /*----- Set local aggregate variables to global backups. -----*/
3098 avg = avg_backup;
3099 if (nullable) {
3100 is_null_backup.emplace(true); // AVG is initially NULL
3101 is_null.emplace(*is_null_backup);
3102 }
3103
3104 /*----- Add global aggregate to result environment to access it in another function. -----*/
3105 if (nullable)
3106 results.add(info.entry.id, Select(*is_null_backup, _Doublex1::Null(), avg_backup));
3107 else
3108 results.add(info.entry.id, avg_backup.val());
3109
3110 /*----- Move aggregate variables to access them later. ----*/
3111 new (&agg_values[idx]) agg_t(std::make_pair(std::move(avg), std::move(is_null)));
3112 new (&agg_value_backups[idx]) agg_backup_t(std::make_pair(
3113 std::move(avg_backup), std::move(is_null_backup)
3114 ));
3115
3116 break;
3117 }
3118 case m::Function::FN_SUM: {
3119 auto sum = [&]<typename T>() {
3120 Var<PrimitiveExpr<T>> sum;
3121 Global<PrimitiveExpr<T>> sum_backup(T(0)); // initialize with neutral element 0
3122 std::optional<Var<Boolx1>> is_null;
3123 std::optional<Global<Boolx1>> is_null_backup;
3124
3125 /*----- Set local aggregate variables to global backups. -----*/
3126 sum = sum_backup;
3127 if (nullable) {
3128 is_null_backup.emplace(true); // SUM is initially NULL
3129 is_null.emplace(*is_null_backup);
3130 }
3131
3132 /*----- Add global aggregate to result environment to access it in another function. -----*/
3133 if (nullable)
3134 results.add(info.entry.id, Select(*is_null_backup, Expr<T>::Null(), sum_backup));
3135 else
3136 results.add(info.entry.id, sum_backup.val());
3137
3138 /*----- Move aggregate variables to access them later. ----*/
3139 new (&agg_values[idx]) agg_t(std::make_pair(std::move(sum), std::move(is_null)));
3140 new (&agg_value_backups[idx]) agg_backup_t(std::make_pair(
3141 std::move(sum_backup), std::move(is_null_backup)
3142 ));
3143 };
3144 auto &n = as<const Numeric>(*info.entry.type);
3145 switch (n.kind) {
3146 case Numeric::N_Int:
3147 case Numeric::N_Decimal:
3148 switch (n.size()) {
3149 default: M_unreachable("invalid size");
3150 case 8: sum.template operator()<int8_t >(); break;
3151 case 16: sum.template operator()<int16_t>(); break;
3152 case 32: sum.template operator()<int32_t>(); break;
3153 case 64: sum.template operator()<int64_t>(); break;
3154 }
3155 break;
3156 case Numeric::N_Float:
3157 if (n.size() <= 32)
3158 sum.template operator()<float>();
3159 else
3160 sum.template operator()<double>();
3161 }
3162 break;
3163 }
3164 case m::Function::FN_COUNT: {
3165 Var<I64x1> count;
3166 Global<I64x1> count_backup(0); // initialize with neutral element 0
3167 /* no `is_null` variables needed since COUNT will not be NULL */
3168
3169 /*----- Set local aggregate variable to global backup. -----*/
3170 count = count_backup;
3171
3172 /*----- Add global aggregate to result environment to access it in another function. -----*/
3173 results.add(info.entry.id, count_backup.val());
3174
3175 /*----- Move aggregate variables to access them later. ----*/
3176 new (&agg_values[idx]) agg_t(std::move(count));
3177 new (&agg_value_backups[idx]) agg_backup_t(std::move(count_backup));
3178
3179 break;
3180 }
3181 }
3182 }
3183
3184 /*----- Initialize keys and their backups. -----*/
3185 auto init = [&]<typename T>(std::size_t idx) {
3186 const bool nullable = M.grouping.schema()[idx].nullable();
3187
3188 Var<PrimitiveExpr<T>> key;
3189 Global<PrimitiveExpr<T>> key_backup;
3190 std::optional<Var<Boolx1>> is_null;
3191 std::optional<Global<Boolx1>> is_null_backup;
3192
3193 /*----- Set local key variables to global backups. -----*/
3194 key = key_backup;
3195 if (nullable) {
3196 is_null_backup.emplace();
3197 is_null.emplace(*is_null_backup);
3198 }
3199
3200 try {
3201 auto id = M.grouping.schema()[idx].id;
3202 key_schema.find(id);
3203
3204 /*----- Add global key to result environment to access it in another function. -----*/
3205 if (nullable)
3206 results.add(id, Select(*is_null_backup, Expr<T>::Null(), key_backup));
3207 else
3208 results.add(id, key_backup.val());
3209 } catch (invalid_argument&) {
3210 /* skip adding to result environment for duplicate keys since they must not be used afterwards */
3211 }
3212
3213 /*----- Move key variables to access them later. ----*/
3214 new (&key_values[idx]) key_t(std::make_pair(std::move(key), std::move(is_null)));
3215 new (&key_value_backups[idx]) key_backup_t(std::make_pair(
3216 std::move(key_backup), std::move(is_null_backup)
3217 ));
3218 };
3219 for (std::size_t idx = 0; idx < num_keys; ++idx) {
3220 visit(overloaded {
3221 [&](const Boolean&) { init.template operator()<bool>(idx); },
3222 [&](const Numeric &n) {
3223 switch (n.kind) {
3224 case Numeric::N_Int:
3225 case Numeric::N_Decimal:
3226 switch (n.size()) {
3227 default: M_unreachable("invalid size");
3228 case 8: init.template operator()<int8_t >(idx); break;
3229 case 16: init.template operator()<int16_t>(idx); break;
3230 case 32: init.template operator()<int32_t>(idx); break;
3231 case 64: init.template operator()<int64_t>(idx); break;
3232 }
3233 break;
3234 case Numeric::N_Float:
3235 if (n.size() <= 32)
3236 init.template operator()<float>(idx);
3237 else
3238 init.template operator()<double>(idx);
3239 }
3240 },
3241 [&](const CharacterSequence &cs) {
3242 Var<Ptr<Charx1>> key;
3243 Global<Ptr<Charx1>> key_backup;
3244 /* no `is_null` variables needed since pointer types must not be NULL */
3245
3246 /*----- Set local key variable to global backup. -----*/
3247 key = key_backup;
3248
3249 try {
3250 auto id = M.grouping.schema()[idx].id;
3251 key_schema.find(id);
3252
3253 /*----- Add global key to result environment to access it in another function. -----*/
3254 NChar str(key_backup.val(), M.grouping.schema()[idx].nullable(), cs.length, cs.is_varying);
3255 results.add(id, std::move(str));
3256 } catch (invalid_argument&) {
3257 /* skip adding to result environment for duplicate keys since they must not be used
3258 * afterwards */
3259 }
3260
3261 /*----- Move key variables to access them later. ----*/
3262 new (&key_values[idx]) key_t(std::move(key));
3263 new (&key_value_backups[idx]) key_backup_t(std::move(key_backup));
3264 },
3265 [&](const Date&) { init.template operator()<int32_t>(idx); },
3266 [&](const DateTime&) { init.template operator()<int64_t>(idx); },
3267 [](auto&&) { M_unreachable("invalid type"); },
3268 }, *M.grouping.schema()[idx].type);
3269 }
3270 }),
3271 /* pipeline= */ [&](){
3272 auto &env = CodeGenContext::Get().env();
3273
3274 /*----- If predication is used, introduce pred. var. and update it before computing aggregates. -----*/
3275 std::optional<Var<Boolx1>> pred;
3276 if (env.predicated()) {
3277 M_insist(CodeGenContext::Get().num_simd_lanes() == 1, "invalid number of SIMD lanes");
3278 pred = env.extract_predicate<_Boolx1>().is_true_and_not_null();
3279 }
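 /* Instead of branching on the predicate, each update below selects the neutral element (or NULL) for tuples
  * whose predicate is false, turning their contribution into a no-op. */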
3280
3281 /*----- Compute aggregates. -----*/
3282 Block reset_aggs("ordered_grouping.reset_aggs", false),
3283 update_aggs("ordered_grouping.update_aggs", false),
3284 update_avg_aggs("ordered_grouping.update_avg_aggs", false);
3285 for (std::size_t idx = 0; idx < aggregates.size(); ++idx) {
3286 auto &info = aggregates[idx];
3287
3288 bool is_min = false;
3289 switch (info.fnid) {
3290 default:
3291 M_unreachable("unsupported aggregate function");
3292 case m::Function::FN_MIN:
3293 is_min = true; // set flag and delegate to MAX case
3294 case m::Function::FN_MAX: {
3295 M_insist(info.args.size() == 1, "MIN and MAX aggregate functions expect exactly one argument");
3296 const auto &arg = *info.args[0];
3297 auto min_max = [&]<typename T>() {
3298 auto neutral = is_min ? std::numeric_limits<T>::max()
3299 : std::numeric_limits<T>::lowest();
3300
3301 auto &[min_max, is_null] = *M_notnull((
3302 std::get_if<std::pair<Var<PrimitiveExpr<T>>, std::optional<Var<Boolx1>>>>(&agg_values[idx])
3303 ));
3304
3305 BLOCK_OPEN(reset_aggs) {
3306 min_max = neutral;
3307 if (is_null)
3308 is_null->set_true();
3309 }
3310
3311 BLOCK_OPEN(update_aggs) {
3312 auto _arg = env.compile(arg);
3313 Expr<T> _new_val = convert<Expr<T>>(_arg);
3314 M_insist(_new_val.can_be_null() == bool(is_null));
3315 if (_new_val.can_be_null()) {
3317 auto _new_val_pred = pred ? Select(*pred, _new_val, Expr<T>::Null()) : _new_val;
3318 auto [new_val_, new_val_is_null_] = _new_val_pred.split();
3319 const Var<Boolx1> new_val_is_null(new_val_is_null_); // due to multiple uses
3320
3321 if constexpr (std::floating_point<T>) {
3322 min_max = Select(new_val_is_null,
3323 min_max, // ignore NULL
3324 is_min ? min(min_max, new_val_) // update old min with new value
3325 : max(min_max, new_val_)); // update old max with new value
3326 } else {
3327 const Var<PrimitiveExpr<T>> new_val(new_val_); // due to multiple uses
3328 auto cmp = is_min ? new_val < min_max : new_val > min_max;
3329#if 1
3330 min_max = Select(new_val_is_null,
3331 min_max, // ignore NULL
3332 Select(cmp,
3333 new_val, // update to new value
3334 min_max)); // do not update
3335#else
3336 IF (not new_val_is_null and cmp) {
3337 min_max = new_val;
3338 };
3339#endif
3340 }
3341 *is_null = *is_null and new_val_is_null; // MIN/MAX is NULL iff all values are NULL
3342 } else {
3343 auto _new_val_pred = pred ? Select(*pred, _new_val, neutral) : _new_val;
3344 auto new_val_ = _new_val_pred.insist_not_null();
3345 if constexpr (std::floating_point<T>) {
3346 min_max = is_min ? min(min_max, new_val_) // update old min with new value
3347 : max(min_max, new_val_); // update old max with new value
3348 } else {
3349 const Var<PrimitiveExpr<T>> new_val(new_val_); // due to multiple uses
3350 auto cmp = is_min ? new_val < min_max : new_val > min_max;
3351#if 1
3352 min_max = Select(cmp,
3353 new_val, // update to new value
3354 min_max); // do not update
3355#else
3356 IF (cmp) {
3357 min_max = new_val;
3358 };
3359#endif
3360 }
3361 }
3362 }
3363 };
3364 auto &n = as<const Numeric>(*info.entry.type);
3365 switch (n.kind) {
3366 case Numeric::N_Int:
3367 case Numeric::N_Decimal:
3368 switch (n.size()) {
3369 default: M_unreachable("invalid size");
3370 case 8: min_max.template operator()<int8_t >(); break;
3371 case 16: min_max.template operator()<int16_t>(); break;
3372 case 32: min_max.template operator()<int32_t>(); break;
3373 case 64: min_max.template operator()<int64_t>(); break;
3374 }
3375 break;
3376 case Numeric::N_Float:
3377 if (n.size() <= 32)
3378 min_max.template operator()<float>();
3379 else
3380 min_max.template operator()<double>();
3381 }
3382 break;
3383 }
3384 case m::Function::FN_AVG:
3385 break; // skip here and handle later
3386 case m::Function::FN_SUM: {
3387 M_insist(info.args.size() == 1, "SUM aggregate function expects exactly one argument");
3388 const auto &arg = *info.args[0];
3389
3390 auto sum = [&]<typename T>() {
3391 auto &[sum, is_null] = *M_notnull((
3392 std::get_if<std::pair<Var<PrimitiveExpr<T>>, std::optional<Var<Boolx1>>>>(&agg_values[idx])
3393 ));
3394
3395 BLOCK_OPEN(reset_aggs) {
3396 sum = T(0);
3397 if (is_null)
3398 is_null->set_true();
3399 }
3400
3401 BLOCK_OPEN(update_aggs) {
3402 auto _arg = env.compile(arg);
3403 Expr<T> _new_val = convert<Expr<T>>(_arg);
3404 M_insist(_new_val.can_be_null() == bool(is_null));
3405 if (_new_val.can_be_null()) {
3407 auto _new_val_pred = pred ? Select(*pred, _new_val, Expr<T>::Null()) : _new_val;
3408 auto [new_val, new_val_is_null_] = _new_val_pred.split();
3409 const Var<Boolx1> new_val_is_null(new_val_is_null_); // due to multiple uses
3410
3411 sum += Select(new_val_is_null,
3412 T(0), // ignore NULL
3413 new_val); // add new value to old sum
3414 *is_null = *is_null and new_val_is_null; // SUM is NULL iff all values are NULL
3415 } else {
3416 auto _new_val_pred = pred ? Select(*pred, _new_val, T(0)) : _new_val;
3417 sum += _new_val_pred.insist_not_null(); // add new value to old sum
3418 }
3419 }
3420 };
3421 auto &n = as<const Numeric>(*info.entry.type);
3422 switch (n.kind) {
3423 case Numeric::N_Int:
3424 case Numeric::N_Decimal:
3425 switch (n.size()) {
3426 default: M_unreachable("invalid size");
3427 case 8: sum.template operator()<int8_t >(); break;
3428 case 16: sum.template operator()<int16_t>(); break;
3429 case 32: sum.template operator()<int32_t>(); break;
3430 case 64: sum.template operator()<int64_t>(); break;
3431 }
3432 break;
3433 case Numeric::N_Float:
3434 if (n.size() <= 32)
3435 sum.template operator()<float>();
3436 else
3437 sum.template operator()<double>();
3438 }
3439 break;
3440 }
3441 case m::Function::FN_COUNT: {
3442 M_insist(info.args.size() <= 1, "COUNT aggregate function expects at most one argument");
3443 M_insist(info.entry.type->is_integral() and info.entry.type->size() == 64);
3444
3445 auto &count = *M_notnull(std::get_if<Var<I64x1>>(&agg_values[idx]));
3446
3447 BLOCK_OPEN(reset_aggs) {
3448 count = int64_t(0);
3449 }
3450
3451 BLOCK_OPEN(update_aggs) {
3452 if (info.args.empty()) {
3453 count += pred ? pred->to<int64_t>() : I64x1(1); // increment old count by 1 iff `pred` is true
3454 } else {
3455 auto _new_val = env.compile(*info.args[0]);
3456 if (can_be_null(_new_val)) {
3458 I64x1 inc = pred ? (not_null(_new_val) and *pred).to<int64_t>()
3459 : not_null(_new_val).to<int64_t>();
3460 count += inc; // increment old count by 1 iff new value is present and `pred` is true
3461 } else {
3462 discard(_new_val); // since it is not needed in this case
3463 I64x1 inc = pred ? pred->to<int64_t>() : I64x1(1);
3464 count += inc; // increment old count by 1 iff new value is present and `pred` is true
3465 }
3466 }
3467 }
3468 break;
3469 }
3470 }
3471 }
3472
3473 /*----- Compute AVG aggregates after the others to ensure that the running count has already been created. -----*/
3474 for (std::size_t idx = 0; idx < aggregates.size(); ++idx) {
3475 auto &info = aggregates[idx];
3476
3477 if (info.fnid == m::Function::FN_AVG) {
3478 M_insist(info.args.size() == 1, "AVG aggregate function expects exactly one argument");
3479 const auto &arg = *info.args[0];
3480 M_insist(info.entry.type->is_double());
3481
3482 auto it = avg_aggregates.find(info.entry.id);
3483 M_insist(it != avg_aggregates.end());
3484 const auto &avg_info = it->second;
3485 M_insist(avg_info.compute_running_avg,
3486 "AVG aggregate may only occur for running average computations");
3487
3488 auto &[avg, is_null] = *M_notnull((
3489 std::get_if<std::pair<Var<Doublex1>, std::optional<Var<Boolx1>>>>(&agg_values[idx])
3490 ));
3491
3492 BLOCK_OPEN(reset_aggs) {
3493 avg = 0.0;
3494 if (is_null)
3495 is_null->set_true();
3496 }
3497
3498 BLOCK_OPEN(update_avg_aggs) {
3499 /* Compute AVG as iterative mean as described in Knuth, The Art of Computer Programming
3500 * Vol 2, section 4.2.2. */
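 /* With running count k and new value x_k this is: avg_k = avg_{k-1} + (x_k - avg_{k-1}) / k, a one-pass
  * update that avoids materializing a potentially overflowing running sum. */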
3501 auto running_count_idx = std::distance(
3502 aggregates.cbegin(),
3503 std::find_if(aggregates.cbegin(), aggregates.cend(), [&avg_info](const auto &info){
3504 return info.entry.id == avg_info.running_count;
3505 })
3506 );
3507 M_insist(0 <= running_count_idx and running_count_idx < aggregates.size());
3508 auto &running_count = *M_notnull(std::get_if<Var<I64x1>>(&agg_values[running_count_idx]));
3509
3510 auto _arg = env.compile(arg);
3511 _Doublex1 _new_val = convert<_Doublex1>(_arg);
3512 M_insist(_new_val.can_be_null() == bool(is_null));
3513 if (_new_val.can_be_null()) {
3515 auto _new_val_pred = pred ? Select(*pred, _new_val, _Doublex1::Null()) : _new_val;
3516 auto [new_val, new_val_is_null_] = _new_val_pred.split();
3517 const Var<Boolx1> new_val_is_null(new_val_is_null_); // due to multiple uses
3518
3519 auto delta_absolute = new_val - avg;
3520 auto delta_relative = delta_absolute / running_count.to<double>();
3521
3522 avg += Select(new_val_is_null,
3523 0.0, // ignore NULL
3524 delta_relative); // update old average with new value
3525 *is_null = *is_null and new_val_is_null; // AVG is NULL iff all values are NULL
3526 } else {
3527 auto _new_val_pred = pred ? Select(*pred, _new_val, avg) : _new_val;
3528 auto delta_absolute = _new_val_pred.insist_not_null() - avg;
3529 auto delta_relative = delta_absolute / running_count.to<double>();
3530
3531 avg += delta_relative; // update old average with new value
3532 }
3533 }
3534 }
3535 }
3536
3537 /*----- Compute whether new group starts and update key variables accordingly. -----*/
3538 std::optional<Boolx1> group_differs;
3539 Block update_keys("ordered_grouping.update_grouping_keys", false);
3540 for (std::size_t idx = 0; idx < num_keys; ++idx) {
3541 std::visit(overloaded {
3542 [&]<typename T>(Expr<T> value) -> void {
3543 auto &[key_val, key_is_null] = *M_notnull((
3544 std::get_if<std::pair<Var<PrimitiveExpr<T>>, std::optional<Var<Boolx1>>>>(&key_values[idx])
3545 ));
3546 M_insist(value.can_be_null() == bool(key_is_null));
3547
3548 if (value.can_be_null()) {
3550 auto [val, is_null] = value.clone().split();
3551 auto null_differs = is_null != *key_is_null;
3552 Boolx1 key_differs = null_differs or (not *key_is_null and val != key_val);
3553 if (group_differs)
3554 group_differs.emplace(key_differs or *group_differs);
3555 else
3556 group_differs.emplace(key_differs);
3557
3558 BLOCK_OPEN(update_keys) {
3559 std::tie(key_val, key_is_null) = value.split();
3560 }
3561 } else {
3562 Boolx1 key_differs = key_val != value.clone().insist_not_null();
3563 if (group_differs)
3564 group_differs.emplace(key_differs or *group_differs);
3565 else
3566 group_differs.emplace(key_differs);
3567
3568 BLOCK_OPEN(update_keys) {
3569 key_val = value.insist_not_null();
3570 }
3571 }
3572 },
3573 [&](NChar value) -> void {
3574 auto &key = *M_notnull(std::get_if<Var<Ptr<Charx1>>>(&key_values[idx]));
3575
3576 auto [key_addr, key_is_nullptr] = key.val().split();
3577 auto [addr, is_nullptr] = value.val().clone().split();
3578 auto addr_differs = strncmp(
3579 /* left= */ NChar(addr, value.can_be_null(), value.length(),
3580 value.guarantees_terminating_nul()),
3581 /* right= */ NChar(key_addr, value.can_be_null(), value.length(),
3582 value.guarantees_terminating_nul()),
3583 /* len= */ U32x1(value.length()),
3584 /* op= */ NE
3585 );
3586 auto [addr_differs_value, addr_differs_is_null] = addr_differs.split();
3587 addr_differs_is_null.discard(); // use the potentially-NULL comparison value; it is overruled below if a nullptr is involved
3588 auto nullptr_differs = is_nullptr != key_is_nullptr.clone();
3589 Boolx1 key_differs = nullptr_differs or (not key_is_nullptr and addr_differs_value);
3590 if (group_differs)
3591 group_differs.emplace(key_differs or *group_differs);
3592 else
3593 group_differs.emplace(key_differs);
3594
3595 BLOCK_OPEN(update_keys) {
3596 key = value.val();
3597 }
3598 },
3599 [](auto) -> void { M_unreachable("SIMDfication currently not supported"); },
3600 [](std::monostate) -> void { M_unreachable("invalid expression"); },
3601 }, env.compile(M.grouping.group_by()[idx].first.get()));
3602 }
3603 M_insist(bool(group_differs));
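 /* Per key, a group change is detected as: NULL-ness differs, or both values are non-NULL and compare
  * unequal; the per-key results are OR-ed into `group_differs`. */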
3604
3605 /*----- Resume pipeline with computed group iff new one starts and emit code to reset aggregates. ---*/
3606 M_insist(bool(first_iteration));
3607 Boolx1 cond = *first_iteration or *group_differs; // in the first iteration `group_differs` compares against default-initialized keys but is overruled by `first_iteration` anyway
3608 IF (pred ? Select(*pred, cond, false) : cond) { // ignore entries for which predication predicate is not fulfilled
3609 IF (not *first_iteration) {
3610 store_locals_to_globals();
3611 emit_group_and_resume_pipeline();
3612 reset_aggs.attach_to_current();
3613 };
3614 update_keys.attach_to_current();
3615 *first_iteration = false;
3616 };
3617
3618 /*----- Emit code to update aggregates. -----*/
3619 update_aggs.attach_to_current();
3620 update_avg_aggs.attach_to_current(); // after the others to ensure that the running count has already been incremented
3621 },
3622 /* teardown= */ teardown_t::Make_Without_Parent([&](){
3623 store_locals_to_globals();
3624
3625 /*----- Destroy created aggregate values and their backups. -----*/
3626 for (std::size_t idx = 0; idx < aggregates.size(); ++idx) {
3627 agg_values[idx].~agg_t();
3628 agg_value_backups[idx].~agg_backup_t();
3629 }
3630
3631 M_insist(bool(first_iteration));
3632 first_iteration_backup = *first_iteration;
3633 first_iteration.reset();
3634 })
3635 );
3636
3637 /*----- If input was not empty, emit last group tuple in the current environment and resume the pipeline. -----*/
3638 IF (not first_iteration_backup) {
3639 emit_group_and_resume_pipeline();
3640 };
3641
3642 /*----- Delayed definition of function to emit group and resume pipeline (since result environment is needed). ---*/
3643 auto fn = emit_group_and_resume_pipeline.make_function(); // outside BLOCK_OPEN-macro to register as current function
3644 BLOCK_OPEN(fn.body()) {
3645 auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function
3646 auto &env = CodeGenContext::Get().env();
3647
3648 /*----- Emit setup code *before* possibly introducing temporary boolean variables so as not to overwrite them. -----*/
3649 setup();
3650
3651 /*----- Add computed group tuple to current environment. ----*/
3652 for (auto &e : M.grouping.schema().deduplicate()) {
3653 try {
3654 key_schema.find(e.id);
3655 } catch (invalid_argument&) {
3656 continue; // skip duplicated keys since they must not be used afterwards
3657 }
3658
3659 if (auto it = avg_aggregates.find(e.id);
3660 it != avg_aggregates.end() and not it->second.compute_running_avg)
3661 { // AVG aggregate that is not yet computed; divide computed sum by computed count
3662 auto &avg_info = it->second;
3663 auto sum = results.get(avg_info.sum);
3664 auto count = results.get<_I64x1>(avg_info.running_count).insist_not_null().to<double>();
3665 auto avg = convert<_Doublex1>(sum) / count;
3666 if (avg.can_be_null()) {
3667 _Var<Doublex1> var(avg); // introduce variable s.t. uses only load from it
3668 env.add(e.id, var);
3669 } else {
3670 /* introduce variable w/o NULL bit s.t. uses only load from it */
3671 Var<Doublex1> var(avg.insist_not_null());
3672 env.add(e.id, _Doublex1(var));
3673 }
3674 } else { // part of key or already computed aggregate
3675 std::visit(overloaded {
3676 [&]<typename T>(Expr<T> value) -> void {
3677 if (value.can_be_null()) {
3678 Var<Expr<T>> var(value); // introduce variable s.t. uses only load from it
3679 env.add(e.id, var);
3680 } else {
3681 /* introduce variable w/o NULL bit s.t. uses only load from it */
3682 Var<PrimitiveExpr<T>> var(value.insist_not_null());
3683 env.add(e.id, Expr<T>(var));
3684 }
3685 },
3686 [&](NChar value) -> void {
3687 Var<Ptr<Charx1>> var(value.val()); // introduce variable s.t. uses only load from it
3688 env.add(e.id, NChar(var, value.can_be_null(), value.length(),
3689 value.guarantees_terminating_nul()));
3690 },
3691 [](auto) -> void { M_unreachable("SIMDfication currently not supported"); },
3692 [](std::monostate) -> void { M_unreachable("invalid reference"); },
3693 }, results.get(e.id)); // do not extract to be able to access for not-yet-computed AVG aggregates
3694 }
3695 }
3696
3697 /*----- Resume pipeline. -----*/
3698 pipeline();
3699
3700 /*----- Emit teardown code. -----*/
3701 teardown();
3702 }
3703}
3704
3705
3706/*======================================================================================================================
3707 * Aggregation
3708 *====================================================================================================================*/
3709
3710ConditionSet Aggregation::pre_condition(std::size_t child_idx, const std::tuple<const AggregationOperator*>&)
3711{
3712 M_insist(child_idx == 0);
3713
3714 ConditionSet pre_cond;
3715
3716 return pre_cond;
3717}
3718
3719ConditionSet Aggregation::post_condition(const Match<Aggregation> &M)
3720{
3721 ConditionSet post_cond;
3722
3723 /*----- Aggregation does not introduce predication. -----*/
3724 post_cond.add_condition(Predicated(false));
3725
3726 /*----- Aggregation implicitly sorts the data since only one tuple is produced. -----*/
3727 Sortedness::order_t orders;
3728 for (auto &e : M.aggregation.schema().deduplicate())
3729 orders.add(e.id, Sortedness::O_UNDEF);
3730 post_cond.add_condition(Sortedness(std::move(orders)));
3731
3732 /*----- Aggregation does not introduce SIMD since only one tuple is produced. -----*/
3733 post_cond.add_condition(NoSIMD());
3734
3735 return post_cond;
3736}
3737
3738void Aggregation::execute(const Match<Aggregation> &M, setup_t setup, pipeline_t pipeline, teardown_t teardown)
3739{
3740 Environment results;
3742 std::vector<std::function<void(void)>> finalize_aggregates;
3743
3744 /*----- Compute information about aggregates, especially about AVG aggregates. -----*/
3745 auto p = compute_aggregate_info(M.aggregation.aggregates(), M.aggregation.schema());
3746 const auto &aggregates = p.first;
3747 const auto &avg_aggregates = p.second;
3748
3749 /*----- Set minimal number of SIMD lanes preferred to get fully utilized SIMD vectors for the aggregate args. ----*/
3750 uint64_t min_size_in_bytes = 16;
3751 for (auto &fn : M.aggregation.aggregates()) {
3752 for (auto &e : fn.get().args) {
3753 visit(overloaded {
3754 [](const m::ast::ErrorExpr&) -> void { M_unreachable("no errors at this stage"); },
3755 [](const m::ast::Designator&) -> void { /* nothing to be done */ },
3756 [](const m::ast::Constant&) -> void { /* nothing to be done */ },
3757 [](const m::ast::QueryExpr&) -> void { /* nothing to be done */ },
3758 [&min_size_in_bytes](const m::ast::FnApplicationExpr &fn) -> void {
3759 M_insist(not fn.get_function().is_aggregate(), "aggregate arguments must not be aggregates");
3760 min_size_in_bytes = std::min(min_size_in_bytes, (fn.type()->size() + 7) / 8);
3761 if (min_size_in_bytes == 1)
3762 throw visit_stop_recursion(); // abort recursion
3763 },
3764 [&min_size_in_bytes](auto &e) -> void { // i.e. for unary and binary expressions
3765 min_size_in_bytes = std::min(min_size_in_bytes, (e.type()->size() + 7) / 8);
3766 if (min_size_in_bytes == 1)
3767 throw visit_stop_recursion(); // abort recursion
3768 }
3769 }, *e, m::tag<m::ast::ConstPreOrderExprVisitor>());
3770 }
3771 }
3772 CodeGenContext::Get().update_num_simd_lanes_preferred(16 / min_size_in_bytes); // set own preference
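 /* E.g. with 16-byte vectors and a smallest argument type of 4 bytes, 16 / 4 = 4 lanes are preferred. */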
3773
3774 /*----- Set minimal number of SIMD lanes preferred to be able to compute running averages. ----*/
3775 if (std::any_of(avg_aggregates.begin(), avg_aggregates.end(), [](auto &i){ return i.second.compute_running_avg; }))
3776 CodeGenContext::Get().update_num_simd_lanes_preferred(4); // set own preference
3777
3778 /*----- Create child function. -----*/
3779 FUNCTION(aggregation_child_pipeline, void(void)) // create function for pipeline
3780 {
3781 auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function
3782
3783#ifndef NDEBUG
3784 std::size_t num_simd_lanes;
3785#endif
3786 void *_agg_values;
3787 void *_agg_value_backups;
3788
3789 M.child->execute(
3790 /* setup= */ setup_t::Make_Without_Parent([&]() {
3791 auto execute_setup = [&]<std::size_t L>() {
3792#ifndef NDEBUG
3793 num_simd_lanes = L;
3794#endif
3795
3796 /*----- Initialize aggregates helper structures. -----*/
3797 using agg_t = agg_t_<false, L>;
3798 using agg_backup_t = agg_t_<true, L>;
3799 auto agg_values = new agg_t[aggregates.size()];
3800 auto agg_value_backups = new agg_backup_t[aggregates.size()];
3801
3802 /*----- Store aggregates helper structures for pipeline and teardown callbacks. -----*/
3803 _agg_values = static_cast<void*>(agg_values);
3804 _agg_value_backups = static_cast<void*>(agg_value_backups);
3805
3806 /*----- Initialize aggregates and their backups. -----*/
3807 for (std::size_t idx = 0; idx < aggregates.size(); ++idx) {
3808 auto &info = aggregates[idx];
3809
3810 bool is_min = false;
3811 switch (info.fnid) {
3812 default:
3813 M_unreachable("unsupported aggregate function");
3814 case m::Function::FN_MIN:
3815 is_min = true; // set flag and delegate to MAX case
3816 case m::Function::FN_MAX: {
3817 auto min_max = [&]<typename T>() {
3818 auto neutral = is_min ? std::numeric_limits<T>::max()
3819 : std::numeric_limits<T>::lowest();
3820
3821 Var<PrimitiveExpr<T, L>> min_max;
3822 Global<PrimitiveExpr<T, L>> min_max_backup(
3823 neutral // initialize with neutral element +inf or -inf
3824 );
3825 Var<Bool<L>> is_null;
3826 Global<Bool<L>> is_null_backup(true); // MIN/MAX is initially NULL
3827
3828 /*----- Set local aggregate variables to global backups. -----*/
3829 min_max = min_max_backup;
3830 is_null = is_null_backup;
3831
3832 /*----- Add global aggregate to result env. to access it in another function. -----*/
3833 if constexpr (L == 1) { // scalar
3834 PrimitiveExpr<T> value = min_max_backup;
3835 Boolx1 is_null = is_null_backup;
3836 results.add(info.entry.id, Select(is_null, Expr<T>::Null(), value));
3837 } else { // vectorial
3838 /* Create lambda which emits the computation of the final *scalar* aggregate.
3839 * This can then be called in the pipeline function starting at the aggregation
3840 * operator s.t. the emitted variable is a local of the correct function.
3841 * Do not access the global variables inside the lambda using closure by
3842 * reference since they will already be destroyed when the lambda is called.
3843 * Instead, copy their values into the lambda. However, since DSL expressions
3844 * are not const-copy-constructible, we have to allocate them on the heap and
3845 * destroy them manually inside the lambda. */
3846 auto simd_min_max = new PrimitiveExpr<T, L>(min_max_backup.val());
3847 auto simd_is_null = new Bool<L>(is_null_backup.val());
3848 finalize_aggregates.emplace_back([&, is_min, simd_min_max, simd_is_null]() {
3849 PrimitiveExpr<T> value = [&]<std::size_t... Is>(std::index_sequence<Is...>) {
3850 Var<PrimitiveExpr<T>> res(simd_min_max->clone().template extract<0>());
3851 auto update = [&]<std::size_t I>(){
3852 if constexpr (requires (PrimitiveExpr<T> v) { min(v, v); max(v, v); }) {
3853 res = is_min ? min(res, simd_min_max->clone().template extract<I>())
3854 : max(res, simd_min_max->clone().template extract<I>());
3855 } else {
3856 const Var<PrimitiveExpr<T>> extracted(
3857 simd_min_max->clone().template extract<I>()
3858 ); // due to multiple uses
3859 auto cmp = is_min ? extracted < res : extracted > res;
3860#if 1
3861 res = Select(cmp, extracted, res);
3862#else
3863 IF (cmp) {
3864 res = extracted;
3865 };
3866#endif
3867 }
3868 };
3869 (update.template operator()<Is + 1>(), ...);
3870 return res;
3871 }(std::make_index_sequence<L - 1>{});
3872 simd_min_max->discard(); // since it was always cloned
3873 Boolx1 is_null = simd_is_null->all_true();
3874 results.add(info.entry.id, Select(is_null, Expr<T>::Null(), value));
3875 delete simd_min_max; // destroy heap-allocated variable
3876 delete simd_is_null; // destroy heap-allocated variable
3877 });
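 /* The emitted reduction starts with lane 0 and folds lanes 1..L-1 into it, either via native min/max or
  * via compare-and-select where no native min/max exists for T. */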
3878 }
3879
3880 /*----- Move aggregate variables to access them later. ----*/
3881 new (&agg_values[idx]) agg_t(std::make_pair(
3882 std::move(min_max), std::move(is_null))
3883 );
3884 new (&agg_value_backups[idx]) agg_backup_t(std::make_pair(
3885 std::move(min_max_backup), std::move(is_null_backup)
3886 ));
3887 };
3888 auto &n = as<const Numeric>(*info.entry.type);
3889 switch (n.kind) {
3890 case Numeric::N_Int:
3891 case Numeric::N_Decimal:
3892 switch (n.size()) {
3893 default: M_unreachable("invalid size");
3894 case 8: min_max.template operator()<int8_t >(); break;
3895 case 16: min_max.template operator()<int16_t>(); break;
3896 case 32: min_max.template operator()<int32_t>(); break;
3897 case 64: min_max.template operator()<int64_t>(); break;
3898 }
3899 break;
3900 case Numeric::N_Float:
3901 if (n.size() <= 32)
3902 min_max.template operator()<float>();
3903 else
3904 min_max.template operator()<double>();
3905 }
3906 break;
3907 }
3908 case m::Function::FN_AVG:
3909 break; // skip here and handle later
3910 case m::Function::FN_SUM: {
3911 auto sum = [&]<typename T>() {
3912 Var<PrimitiveExpr<T, L>> sum;
3913 Global<PrimitiveExpr<T, L>> sum_backup(T(0)); // initialize with neutral element 0
3914 Var<Bool<L>> is_null;
3915 Global<Bool<L>> is_null_backup(true); // SUM is initially NULL
3916
3917 /*----- Set local aggregate variables to global backups. -----*/
3918 sum = sum_backup;
3919 is_null = is_null_backup;
3920
3921 /*----- Add global aggregate to result env. to access it in another function. -----*/
3922 if constexpr (L == 1) { // scalar
3923 PrimitiveExpr<T> value = sum_backup;
3924 Boolx1 is_null = is_null_backup;
3925 results.add(info.entry.id, Select(is_null, Expr<T>::Null(), value));
3926 } else { // vectorial
3927 PrimitiveExpr<T> value = [&]<std::size_t... Is>(std::index_sequence<Is...>) {
3928 return (sum_backup.template extract<Is>() + ...);
3929 }(std::make_index_sequence<L>{});
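 /* The fold expression emits a horizontal lane reduction, e.g. for L = 4:
  * value = sum_backup[0] + sum_backup[1] + sum_backup[2] + sum_backup[3]. */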
3930 Boolx1 is_null = is_null_backup.all_true();
3931 results.add(info.entry.id, Select(is_null, Expr<T>::Null(), value));
3932 }
3933
3934 /*----- Move aggregate variables to access them later. ----*/
3935 new (&agg_values[idx]) agg_t(std::make_pair(std::move(sum), std::move(is_null)));
3936 new (&agg_value_backups[idx]) agg_backup_t(std::make_pair(
3937 std::move(sum_backup), std::move(is_null_backup)
3938 ));
3939 };
3940 auto &n = as<const Numeric>(*info.entry.type);
3941 switch (n.kind) {
3942 case Numeric::N_Int:
3943 case Numeric::N_Decimal:
3944 switch (n.size()) {
3945 default: M_unreachable("invalid size");
3946 case 8: sum.template operator()<int8_t >(); break;
3947 case 16: sum.template operator()<int16_t>(); break;
3948 case 32: sum.template operator()<int32_t>(); break;
3949 case 64: sum.template operator()<int64_t>(); break;
3950 }
3951 break;
3952 case Numeric::N_Float:
3953 if (n.size() <= 32)
3954 sum.template operator()<float>();
3955 else
3956 sum.template operator()<double>();
3957 }
3958 break;
3959 }
3960 case m::Function::FN_COUNT: {
3961 Var<I64<L>> count;
3962 Global<I64<L>> count_backup(0); // initialize with neutral element 0
3963 /* no `is_null` variables needed since COUNT will not be NULL */
3964
3965 /*----- Set local aggregate variable to global backup. -----*/
3966 count = count_backup;
3967
3968 /*----- Add global aggregate to result env. to access it in another function. -----*/
3969 if constexpr (L == 1) { // scalar
3970 I64x1 value = count_backup;
3971 results.add(info.entry.id, value);
3972 } else { // vectorial
3973 I64x1 value = [&]<std::size_t... Is>(std::index_sequence<Is...>) {
3974 return (count_backup.template extract<Is>() + ...);
3975 }(std::make_index_sequence<L>{});
3976 results.add(info.entry.id, value);
3977 }
3978
3979 /*----- Move aggregate variables to access them later. ----*/
3980 new (&agg_values[idx]) agg_t(std::move(count));
3981 new (&agg_value_backups[idx]) agg_backup_t(std::move(count_backup));
3982
3983 break;
3984 }
3985 }
3986 }
3987
3988 /*----- Initialize AVG aggregates after the others to ensure that the running count is initialized first. -----*/
3989 for (std::size_t idx = 0; idx < aggregates.size(); ++idx) {
3990 auto &info = aggregates[idx];
3991
3992 if (info.fnid == m::Function::FN_AVG) {
3993 Var<Double<L>> avg;
3994 Global<Double<L>> avg_backup(0.0); // initialize with neutral element 0
3995 Var<Bool<L>> is_null;
3996 Global<Bool<L>> is_null_backup(true); // AVG is initially NULL
3997
3998 /*----- Set local aggregate variables to global backups. -----*/
3999 avg = avg_backup;
4000 is_null = is_null_backup;
4001
4002 /*----- Add global aggregate to result env. to access it in another function. -----*/
4003 if constexpr (L == 1) { // scalar
4004 Doublex1 value = avg_backup;
4005 Boolx1 is_null = is_null_backup;
4006 results.add(info.entry.id, Select(is_null, _Doublex1::Null(), value));
4007 } else { // vectorial
4008 /* Create lambda which emits the computation of the final *scalar* aggregate.
4009 * This can then be called in the pipeline function starting at the aggregation
4010 * operator s.t. the emitted variable is a local of the correct function.
4011 * Do not access the global variables inside the lambda using closure by
4012 * reference since they will already be destroyed when the lambda is called.
4013 * Instead, copy their values into the lambda. However, since DSL expressions
4014 * are not const-copy-constructible, we have to allocate them on the heap and
4015 * destroy them manually inside the lambda. */
4016 auto simd_avg = new Double<L>(avg_backup.val());
4017 auto simd_is_null = new Bool<L>(is_null_backup.val());
4018 auto simd_running_count = new I64<L>([&](){
4019 auto it = avg_aggregates.find(info.entry.id);
4020 M_insist(it != avg_aggregates.end());
4021 const auto &avg_info = it->second;
4022 M_insist(avg_info.compute_running_avg,
4023 "AVG aggregate may only occur for running average computations");
4024
4025 auto running_count_idx = std::distance(
4026 aggregates.cbegin(),
4027 std::find_if(
4028 aggregates.cbegin(), aggregates.cend(), [&avg_info](const auto &info){
4029 return info.entry.id == avg_info.running_count;
4030 })
4031 );
4032 M_insist(0 <= running_count_idx and running_count_idx < aggregates.size());
4033
4034 auto &running_count =
4035 *M_notnull(std::get_if<Global<I64<L>>>(&agg_value_backups[running_count_idx]));
4036 return running_count.val();
4037 }());
4038 finalize_aggregates.emplace_back([&, simd_avg, simd_is_null, simd_running_count]() {
4039 Doublex1 value = [&]<std::size_t... Is>(std::index_sequence<Is...>) {
4040 I64x1 count = (simd_running_count->clone().template extract<Is>() + ...);
4041 const Var<Double<L>> simd_sum([&](){
4042 if constexpr (L != 2) {
4043 return *simd_avg * simd_running_count->template to<double>();
4044 } else {
4045 M_unreachable("conversion from `I64<2>` to `Double<2>` not supported");
4046 return Double<L>(0.0); // this line is never reached; return dummy value
4047 }
4048 }());
4049 return (simd_sum.template extract<Is>() + ...) / count.to<double>();
4050 }(std::make_index_sequence<L>{});
4051 Boolx1 is_null = simd_is_null->all_true();
4052 results.add(info.entry.id, Select(is_null, _Doublex1::Null(), value));
4053 delete simd_avg; // destroy heap-allocated variable
4054 delete simd_is_null; // destroy heap-allocated variable
4055 delete simd_running_count; // destroy heap-allocated variable
4056 });
4057 }
4058
4059 /*----- Move aggregate variables to access them later. ----*/
4060 new (&agg_values[idx]) agg_t(std::make_pair(std::move(avg), std::move(is_null)));
4061 new (&agg_value_backups[idx]) agg_backup_t(std::make_pair(
4062 std::move(avg_backup), std::move(is_null_backup)
4063 ));
4064 }
4065 }
4066 };
4067 switch (CodeGenContext::Get().num_simd_lanes()) {
4068 default: M_unreachable("unsupported number of SIMD lanes");
4069 case 1: execute_setup.operator()<1>(); break;
4070 case 2: execute_setup.operator()<2>(); break;
4071 case 4: execute_setup.operator()<4>(); break;
4072 case 8: execute_setup.operator()<8>(); break;
4073 case 16: execute_setup.operator()<16>(); break;
4074 case 32: execute_setup.operator()<32>(); break;
4075 }
4076 }),
4077 /* pipeline= */ [&](){
4078 auto execute_pipeline = [&]<std::size_t L>(){
4079#ifndef NDEBUG
4080 M_insist(num_simd_lanes == L,
4081 "number of SIMD lanes in pipeline callback must match the one in setup callback");
4082#endif
4083
4084 /*----- Get aggregates helper structures. -----*/
4085 using agg_t = agg_t_<false, L>;
4086 using agg_backup_t = agg_t_<true, L>;
4087 auto agg_values = static_cast<agg_t*>(_agg_values);
4088 auto agg_value_backups = static_cast<agg_backup_t*>(_agg_value_backups);
4089
4090 auto &env = CodeGenContext::Get().env();
4091
4092 /*----- If predication is used, introduce pred. var. and update it before computing aggregates. --*/
4093 std::optional<Var<Bool<L>>> pred;
4094 if (env.predicated()) {
4095 if constexpr (sql_boolean_type<_Bool<L>>)
4096 pred = env.extract_predicate<_Bool<L>>().is_true_and_not_null();
4097 else
4098 M_unreachable("invalid number of SIMD lanes");
4099 }
4100
4101 /*----- Compute aggregates (except AVG). -----*/
4102 for (std::size_t idx = 0; idx < aggregates.size(); ++idx) {
4103 auto &info = aggregates[idx];
4104
4105 bool is_min = false;
4106 switch (info.fnid) {
4107 default:
4108 M_unreachable("unsupported aggregate function");
4109 case m::Function::FN_MIN:
4110 is_min = true; // set flag and delegate to MAX case
4111 case m::Function::FN_MAX: {
4112 M_insist(info.args.size() == 1,
4113 "MIN and MAX aggregate functions expect exactly one argument");
4114 const auto &arg = *info.args[0];
4115 auto min_max = overloaded{
4116 [&]<typename T>() requires sql_type<Expr<T, L>> {
4117 auto &[min_max, is_null] = *M_notnull((
4118 std::get_if<
4119 std::pair<Var<PrimitiveExpr<T, L>>, Var<Bool<L>>>
4120 >(&agg_values[idx])
4121 ));
4122
4123 auto _arg = env.compile(arg);
4124 Expr<T, L> _new_val = convert<Expr<T, L>>(_arg);
4125 if (_new_val.can_be_null()) {
4127 auto _new_val_pred =
4128 pred ? Select(*pred, _new_val, Expr<T, L>::Null()) : _new_val;
4129 auto [new_val_, new_val_is_null_] = _new_val_pred.split();
4130 const Var<Bool<L>> new_val_is_null(new_val_is_null_); // due to multiple uses
4131
4132 if constexpr (requires (PrimitiveExpr<T, L> v) { min(v, v); max(v, v); }) {
4133 min_max = Select(new_val_is_null,
4134 min_max, // ignore NULL
4135 is_min ? min(min_max, new_val_) // update old min with new value
4136 : max(min_max, new_val_)); // update old max with new value
4137 } else {
4138 const Var<PrimitiveExpr<T, L>> new_val(new_val_); // due to multiple uses
4139 auto cmp = is_min ? new_val < min_max : new_val > min_max;
4140#if 1
4141 min_max = Select(new_val_is_null,
4142 min_max, // ignore NULL
4143 Select(cmp,
4144 new_val, // update to new value
4145 min_max)); // do not update
4146#else
4147 IF (not new_val_is_null and cmp) {
4148 min_max = new_val;
4149 };
4150#endif
4151 }
4152 is_null = is_null and new_val_is_null; // MIN/MAX is NULL iff all values are NULL
4153 } else {
4154 auto neutral = is_min ? std::numeric_limits<T>::max()
4155 : std::numeric_limits<T>::lowest();
4156 auto _new_val_pred =
4157 pred ? Select(*pred, _new_val, PrimitiveExpr<T, L>(neutral)) : _new_val;
4158 auto new_val_ = _new_val_pred.insist_not_null();
4159 if constexpr (requires (PrimitiveExpr<T, L> v) { min(v, v); max(v, v); }) {
4160 min_max = is_min ? min(min_max, new_val_) // update old min with new value
4161 : max(min_max, new_val_); // update old max with new value
4162 } else {
4163 const Var<PrimitiveExpr<T, L>> new_val(new_val_); // due to multiple uses
4164 auto cmp = is_min ? new_val < min_max : new_val > min_max;
4165#if 1
4166 min_max = Select(cmp,
4167 new_val, // update to new value
4168 min_max); // do not update
4169#else
4170 IF (cmp) {
4171 min_max = new_val;
4172 };
4173#endif
4174 }
4175 is_null.set_false(); // at least one non-NULL value is consumed
4176 }
4177 },
4178 []<typename>() { M_unreachable("invalid type for given number of SIMD lanes"); }
4179 };
4180 auto &n = as<const Numeric>(*info.entry.type);
4181 switch (n.kind) {
4182 case Numeric::N_Int:
4183 case Numeric::N_Decimal:
4184 switch (n.size()) {
4185 default: M_unreachable("invalid size");
4186 case 8: min_max.template operator()<int8_t >(); break;
4187 case 16: min_max.template operator()<int16_t>(); break;
4188 case 32: min_max.template operator()<int32_t>(); break;
4189 case 64: min_max.template operator()<int64_t>(); break;
4190 }
4191 break;
4192 case Numeric::N_Float:
4193 if (n.size() <= 32)
4194 min_max.template operator()<float>();
4195 else
4196 min_max.template operator()<double>();
4197 }
4198 break;
4199 }
4200 case m::Function::FN_AVG:
4201 break; // skip here and handle later
4202 case m::Function::FN_SUM: {
4203 M_insist(info.args.size() == 1, "SUM aggregate function expects exactly one argument");
4204 const auto &arg = *info.args[0];
4205
4206 auto sum = overloaded{
4207 [&]<typename T>() requires sql_type<Expr<T, L>> {
4208 auto &[sum, is_null] = *M_notnull((
4209 std::get_if<
4210 std::pair<Var<PrimitiveExpr<T, L>>, Var<Bool<L>>>
4211 >(&agg_values[idx])
4212 ));
4213
4214 auto _arg = env.compile(arg);
4215 Expr<T, L> _new_val = convert<Expr<T, L>>(_arg);
4216 if (_new_val.can_be_null()) {
4218 auto _new_val_pred =
4219 pred ? Select(*pred, _new_val, Expr<T, L>::Null()) : _new_val;
4220 auto [new_val, new_val_is_null_] = _new_val_pred.split();
4221 const Var<Bool<L>> new_val_is_null(new_val_is_null_); // due to multiple uses
4222
4223 sum += Select(new_val_is_null,
4224 PrimitiveExpr<T, L>(T(0)), // ignore NULL
4225 new_val); // add new value to old sum
4226 is_null = is_null and new_val_is_null; // SUM is NULL iff all values are NULL
4227 } else {
4228 auto _new_val_pred =
4229 pred ? Select(*pred, _new_val, PrimitiveExpr<T, L>(T(0))) : _new_val;
4230 sum += _new_val_pred.insist_not_null(); // add new value to old sum
4231 is_null.set_false(); // at least one non-NULL value is consumed
4232 }
4233 },
4234 []<typename>() { M_unreachable("invalid type for given number of SIMD lanes"); }
4235 };
4236 auto &n = as<const Numeric>(*info.entry.type);
4237 switch (n.kind) {
4238 case Numeric::N_Int:
4239 case Numeric::N_Decimal:
4240 switch (n.size()) {
4241 default: M_unreachable("invalid size");
4242 case 8: sum.template operator()<int8_t >(); break;
4243 case 16: sum.template operator()<int16_t>(); break;
4244 case 32: sum.template operator()<int32_t>(); break;
4245 case 64: sum.template operator()<int64_t>(); break;
4246 }
4247 break;
4248 case Numeric::N_Float:
4249 if (n.size() <= 32)
4250 sum.template operator()<float>();
4251 else
4252 sum.template operator()<double>();
4253 }
4254 break;
4255 }
4256 case m::Function::FN_COUNT: {
4257 M_insist(info.args.size() <= 1, "COUNT aggregate function expects at most one argument");
4258 M_insist(info.entry.type->is_integral() and info.entry.type->size() == 64);
4259
4260 auto &count = *M_notnull(std::get_if<Var<I64<L>>>(&agg_values[idx]));
4261
4262 if (info.args.empty()) {
4263 count += pred ? pred->template to<int64_t>() : I64<L>(1); // increment old count by 1 iff `pred` is true
4264 } else {
4265 auto _new_val = env.compile(*info.args[0]);
4266 if (can_be_null(_new_val)) {
4268 I64<L> inc = pred ? (not_null<L>(_new_val) and *pred).template to<int64_t>()
4269 : not_null<L>(_new_val).template to<int64_t>();
4270 count += inc; // increment old count by 1 iff new value is present and `pred` is true
4271 } else {
4272 discard(_new_val); // since it is not needed in this case
4273 I64<L> inc = pred ? pred->template to<int64_t>() : I64<L>(1);
4274 count += inc; // increment old count by 1 iff new value is present and `pred` is true
4275 }
4276 }
4277 break;
4278 }
4279 }
4280 }
4281
4282 /*----- Compute AVG aggregates after others to ensure that running count is incremented before. --*/
4283 for (std::size_t idx = 0; idx < aggregates.size(); ++idx) {
4284 auto &info = aggregates[idx];
4285
4286 if (info.fnid == m::Function::FN_AVG) {
4287 M_insist(info.args.size() == 1, "AVG aggregate function expects exactly one argument");
4288 const auto &arg = *info.args[0];
4289 M_insist(info.entry.type->is_double());
4290
4291 auto it = avg_aggregates.find(info.entry.id);
4292 M_insist(it != avg_aggregates.end());
4293 const auto &avg_info = it->second;
4294 M_insist(avg_info.compute_running_avg,
4295 "AVG aggregate may only occur for running average computations");
4296
4297 auto &[avg, is_null] = *M_notnull((
4298 std::get_if<std::pair<Var<Double<L>>, Var<Bool<L>>>>(&agg_values[idx])
4299 ));
4300
4301 /* Compute AVG as iterative mean as described in Knuth, The Art of Computer Programming
4302 * Vol 2, section 4.2.2. */
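 /* As above: avg_k = avg_{k-1} + (x_k - avg_{k-1}) / k, here applied lane-wise on the SIMD vectors. */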
4303 auto running_count_idx = std::distance(
4304 aggregates.cbegin(),
4305 std::find_if(aggregates.cbegin(), aggregates.cend(), [&avg_info](const auto &info){
4306 return info.entry.id == avg_info.running_count;
4307 })
4308 );
4309 M_insist(0 <= running_count_idx and running_count_idx < aggregates.size());
4310 Double<L> running_count = [&](){
4311 auto &running_count =
4312 *M_notnull(std::get_if<Var<I64<L>>>(&agg_values[running_count_idx]));
4313 if constexpr (L != 2) {
4314 return running_count.template to<double>();
4315 } else {
4316 M_unreachable("conversion from `I64<2>` to `Double<2>` not supported");
4317 return Double<L>(0.0); // this line is never reached; return dummy value
4318 }
4319 }();
4320
4321 auto _arg = env.compile(arg);
4322 _Double<L> _new_val = convert<_Double<L>>(_arg);
4323 if (_new_val.can_be_null()) {
4325 auto _new_val_pred = pred ? Select(*pred, _new_val, _Double<L>::Null()) : _new_val;
4326 auto [new_val, new_val_is_null_] = _new_val_pred.split();
4327 const Var<Bool<L>> new_val_is_null(new_val_is_null_); // due to multiple uses
4328
4329 auto delta_absolute = new_val - avg;
4330 auto delta_relative = delta_absolute / running_count;
4331
4332 avg += Select(new_val_is_null,
4333 Double<L>(0.0), // ignore NULL
4334 delta_relative); // update old average with new value
4335 is_null = is_null and new_val_is_null; // AVG is NULL iff all values are NULL
4336 } else {
4337 auto _new_val_pred = pred ? Select(*pred, _new_val, avg) : _new_val;
4338 auto delta_absolute = _new_val_pred.insist_not_null() - avg;
4339 auto delta_relative = delta_absolute / running_count;
4340
4341 avg += delta_relative; // update old average with new value
4342 is_null.set_false(); // at least one non-NULL value is consumed
4343 }
4344 }
4345 }
4346 };
4347 switch (CodeGenContext::Get().num_simd_lanes()) {
4348 default: M_unreachable("unsupported number of SIMD lanes");
4349 case 1: execute_pipeline.operator()<1>(); break;
4350 case 2: execute_pipeline.operator()<2>(); break;
4351 case 4: execute_pipeline.operator()<4>(); break;
4352 case 8: execute_pipeline.operator()<8>(); break;
4353 case 16: execute_pipeline.operator()<16>(); break;
4354 case 32: execute_pipeline.operator()<32>(); break;
4355 }
4356 },
4357 /* teardown= */ teardown_t::Make_Without_Parent([&](){
4358 auto execute_teardown = [&]<std::size_t L>(){
4359#ifndef NDEBUG
4360 M_insist(num_simd_lanes == L,
4361 "number of SIMD lanes in teardown callback must match the one in setup callback");
4362#endif
4363
4364 /*----- Get aggregates helper structures. -----*/
4365 using agg_t = agg_t_<false, L>;
4366 using agg_backup_t = agg_t_<true, L>;
4367 auto agg_values = static_cast<agg_t*>(_agg_values);
4368 auto agg_value_backups = static_cast<agg_backup_t*>(_agg_value_backups);
4369
4370 /*----- Store local aggregate values to globals to access them in another function. -----*/
4371 for (std::size_t idx = 0; idx < aggregates.size(); ++idx) {
4372 auto &info = aggregates[idx];
4373
4374 bool is_min = false;
4375 switch (info.fnid) {
4376 default:
4377 M_unreachable("unsupported aggregate function");
4378 case m::Function::FN_MIN:
4379 is_min = true; // set flag and delegate to MAX case
4380 case m::Function::FN_MAX: {
4381 auto min_max = [&]<typename T>() {
4382 auto &[min_max_backup, is_null_backup] = *M_notnull((
4383 std::get_if<
4384 std::pair<Global<PrimitiveExpr<T, L>>, Global<Bool<L>>>
4385 >(&agg_value_backups[idx])
4386 ));
4387 std::tie(min_max_backup, is_null_backup) = *M_notnull((
4388 std::get_if<std::pair<Var<PrimitiveExpr<T, L>>, Var<Bool<L>>>>(&agg_values[idx])
4389 ));
4390 };
4391 auto &n = as<const Numeric>(*info.entry.type);
4392 switch (n.kind) {
4393 case Numeric::N_Int:
4394 case Numeric::N_Decimal:
4395 switch (n.size()) {
4396 default: M_unreachable("invalid size");
4397 case 8: min_max.template operator()<int8_t >(); break;
4398 case 16: min_max.template operator()<int16_t>(); break;
4399 case 32: min_max.template operator()<int32_t>(); break;
4400 case 64: min_max.template operator()<int64_t>(); break;
4401 }
4402 break;
4403 case Numeric::N_Float:
4404 if (n.size() <= 32)
4405 min_max.template operator()<float>();
4406 else
4407 min_max.template operator()<double>();
4408 }
4409 break;
4410 }
4411 case m::Function::FN_AVG: {
4412 auto &[avg_backup, is_null_backup] = *M_notnull((
4413 std::get_if<std::pair<Global<Double<L>>, Global<Bool<L>>>>(&agg_value_backups[idx])
4414 ));
4415 std::tie(avg_backup, is_null_backup) = *M_notnull((
4416 std::get_if<std::pair<Var<Double<L>>, Var<Bool<L>>>>(&agg_values[idx])
4417 ));
4418
4419 break;
4420 }
4421 case m::Function::FN_SUM: {
4422 M_insist(info.args.size() == 1, "SUM aggregate function expects exactly one argument");
4423 const auto &arg = *info.args[0];
4424
4425 auto sum = [&]<typename T>() {
4426 auto &[sum_backup, is_null_backup] = *M_notnull((
4427 std::get_if<
4428 std::pair<Global<PrimitiveExpr<T, L>>, Global<Bool<L>>>
4429 >(&agg_value_backups[idx])
4430 ));
4431 std::tie(sum_backup, is_null_backup) = *M_notnull((
4432 std::get_if<std::pair<Var<PrimitiveExpr<T, L>>, Var<Bool<L>>>>(&agg_values[idx])
4433 ));
4434 };
4435 auto &n = as<const Numeric>(*info.entry.type);
4436 switch (n.kind) {
4437 case Numeric::N_Int:
4438 case Numeric::N_Decimal:
4439 switch (n.size()) {
4440 default: M_unreachable("invalid size");
4441 case 8: sum.template operator()<int8_t >(); break;
4442 case 16: sum.template operator()<int16_t>(); break;
4443 case 32: sum.template operator()<int32_t>(); break;
4444 case 64: sum.template operator()<int64_t>(); break;
4445 }
4446 break;
4447 case Numeric::N_Float:
4448 if (n.size() <= 32)
4449 sum.template operator()<float>();
4450 else
4451 sum.template operator()<double>();
4452 }
4453 break;
4454 }
4455 case m::Function::FN_COUNT: {
4456 auto &count_backup = *M_notnull(std::get_if<Global<I64<L>>>(&agg_value_backups[idx]));
4457 count_backup = *M_notnull(std::get_if<Var<I64<L>>>(&agg_values[idx]));
4458
4459 break;
4460 }
4461 }
4462 }
4463
4464 /*----- Destroy created aggregates and their backups. -----*/
4465 for (std::size_t idx = 0; idx < aggregates.size(); ++idx) {
4466 agg_values[idx].~agg_t();
4467 agg_value_backups[idx].~agg_backup_t();
4468 }
4469
4470 /*----- Free aggregates helper structures. -----*/
4471 delete[] agg_values;
4472 delete[] agg_value_backups;
4473 };
4474 switch (CodeGenContext::Get().num_simd_lanes()) {
4475 default: M_unreachable("unsupported number of SIMD lanes");
4476 case 1: execute_teardown.operator()<1>(); break;
4477 case 2: execute_teardown.operator()<2>(); break;
4478 case 4: execute_teardown.operator()<4>(); break;
4479 case 8: execute_teardown.operator()<8>(); break;
4480 case 16: execute_teardown.operator()<16>(); break;
4481 case 32: execute_teardown.operator()<32>(); break;
4482 }
4483 })
4484 );
4485 }
4486 aggregation_child_pipeline(); // call child function
4487
4488 /*----- Emit setup code *before* possibly introducing temporary boolean variables to not overwrite them. -----*/
4489 setup();
4490
4491 /*----- Emit code to finalize aggregate computations. -----*/
4492 for (auto &fn : finalize_aggregates)
4493 fn();
4494
4495 /*----- Add computed aggregates tuple to current environment. -----*/
4496 auto &env = CodeGenContext::Get().env();
4497 for (auto &e : M.aggregation.schema().deduplicate()) {
4498 if (auto it = avg_aggregates.find(e.id);
4499 it != avg_aggregates.end() and not it->second.compute_running_avg)
4500 { // AVG aggregate which is not yet computed: divide the computed sum by the computed count
4501 auto &avg_info = it->second;
4502 auto sum = results.get(avg_info.sum);
4503 auto count = results.get<_I64x1>(avg_info.running_count).insist_not_null().to<double>();
4504 auto avg = convert<_Doublex1>(sum) / count;
4505 M_insist(avg.can_be_null());
4506 _Var<Doublex1> var(avg); // introduce variable s.t. uses only load from it
4507 env.add(e.id, var);
4508 } else { // already computed aggregate
4509 std::visit(overloaded {
4510 [&]<typename T>(Expr<T> value) -> void {
4511 if (value.can_be_null()) {
4512 Var<Expr<T>> var(value); // introduce variable s.t. uses only load from it
4513 env.add(e.id, var);
4514 } else {
4515 /* introduce variable w/o NULL bit s.t. uses only load from it */
4516 Var<PrimitiveExpr<T>> var(value.insist_not_null());
4517 env.add(e.id, Expr<T>(var));
4518 }
4519 },
4520 [](auto) -> void { M_unreachable("only scalar and non-string values must occur"); },
4521 [](std::monostate) -> void { M_unreachable("invalid reference"); },
4522 }, results.get(e.id)); // do not extract to be able to access for not-yet-computed AVG aggregates
4523 }
4524 }
4525
4526 /*----- Resume pipeline. -----*/
4527 CodeGenContext::Get().set_num_simd_lanes(1); // since only a single tuple is produced
4528 pipeline();
4529
4530 /*----- Emit teardown code. -----*/
4531 teardown();
4532}
4533
4534
4535/*======================================================================================================================
4536 * Sorting
4537 *====================================================================================================================*/
4538
4539template<bool CmpPredicated>
4540ConditionSet Quicksort<CmpPredicated>::pre_condition(std::size_t child_idx, const std::tuple<const SortingOperator*>&)
4541{
4542 M_insist(child_idx == 0);
4543
4544 ConditionSet pre_cond;
4545
4546 /*----- Sorting does not support SIMD. -----*/
4547 pre_cond.add_condition(NoSIMD());
4548
4549 return pre_cond;
4550}
4551
4552template<bool CmpPredicated>
4553ConditionSet Quicksort<CmpPredicated>::post_condition(const Match<Quicksort> &M)
4554{
4555 ConditionSet post_cond;
4556
4557 /*----- Quicksort does not introduce predication. -----*/
4558 post_cond.add_condition(Predicated(false));
4559
4560 /*----- Quicksort does sort the data. -----*/
4561 Sortedness::order_t orders;
4562 for (auto &o : M.sorting.order_by()) {
4563 Schema::Identifier id(o.first);
4564 if (orders.find(id) == orders.cend())
4565 orders.add(std::move(id), o.second ? Sortedness::O_ASC : Sortedness::O_DESC);
4566 }
4567 post_cond.add_condition(Sortedness(std::move(orders)));
4568
4569 /*----- Sorting does not introduce SIMD. -----*/
4570 post_cond.add_condition(NoSIMD());
4571
4572 return post_cond;
4573}
4574
4575template<bool CmpPredicated>
4576void Quicksort<CmpPredicated>::execute(const Match<Quicksort> &M, setup_t setup, pipeline_t pipeline, teardown_t
4577 teardown)
4578{
4579 /*----- Create infinite buffer to materialize the current results but resume the pipeline later. -----*/
4580 M_insist(bool(M.materializing_factory), "`wasm::Quicksort` must have a factory for the materialized child");
4581 const auto buffer_schema = M.child->get_matched_root().schema().drop_constants().deduplicate();
4582 const auto sorting_schema = M.sorting.schema().drop_constants().deduplicate();
4583 GlobalBuffer buffer(
4584 buffer_schema, *M.materializing_factory, false, 0, std::move(setup), std::move(pipeline), std::move(teardown)
4585 );
4586
4587 /*----- Create child function. -----*/
4588 FUNCTION(sorting_child_pipeline, void(void)) // create function for pipeline
4589 {
4590 auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function
4591
4592 M.child->execute(
4593 /* setup= */ setup_t::Make_Without_Parent([&](){ buffer.setup(); }),
4594 /* pipeline= */ [&](){ buffer.consume(); },
4595 /* teardown= */ teardown_t::Make_Without_Parent([&](){ buffer.teardown(); })
4596 );
4597 }
4598 sorting_child_pipeline(); // call child function
4599
4600 /*----- Invoke quicksort algorithm with buffer to sort. -----*/
4601 quicksort<CmpPredicated>(buffer, M.sorting.order_by());
4602
4603 /*----- Process sorted buffer. -----*/
4604 buffer.resume_pipeline(sorting_schema);
4605}
4606
4607ConditionSet NoOpSorting::pre_condition(std::size_t child_idx,
4608 const std::tuple<const SortingOperator*> &partial_inner_nodes)
4609{
4610 M_insist(child_idx == 0);
4611
4612 ConditionSet pre_cond;
4613
4614 /*----- NoOpSorting, i.e. a no-op matching a sorting operator, requires the data to be sorted already. -----*/
4615 Sortedness::order_t orders;
4616 for (auto &o : std::get<0>(partial_inner_nodes)->order_by()) {
4617 Schema::Identifier id(o.first);
4618 if (orders.find(id) == orders.cend())
4619 orders.add(std::move(id), o.second ? Sortedness::O_ASC : Sortedness::O_DESC);
4620 }
4621 pre_cond.add_condition(Sortedness(std::move(orders)));
4622
4623 return pre_cond;
4624}
4625
4626void NoOpSorting::execute(const Match<NoOpSorting> &M, setup_t setup, pipeline_t pipeline, teardown_t teardown)
4627{
4628 M.child->execute(std::move(setup), std::move(pipeline), std::move(teardown));
4629}
4630
4631
4632/*======================================================================================================================
4633 * Join
4634 *====================================================================================================================*/
4635
4636template<bool Predicated>
4637ConditionSet NestedLoopsJoin<Predicated>::pre_condition(std::size_t, const std::tuple<const JoinOperator*>&)
4638{
4639 ConditionSet pre_cond;
4640
4641 /*----- Nested-loops join does not support SIMD. -----*/
4642 pre_cond.add_condition(NoSIMD());
4643
4644 return pre_cond;
4645}
4646
4647template<bool Predicated>
4648ConditionSet NestedLoopsJoin<Predicated>::post_condition(
4649 const Match<NestedLoopsJoin>&,
4650 std::vector<std::reference_wrapper<const ConditionSet>> &&post_cond_children)
4651{
4652 M_insist(post_cond_children.size() >= 2);
4653
4654 ConditionSet post_cond(post_cond_children.back().get()); // preserve conditions of right-most child
4655
4656 if constexpr (Predicated) {
4657 /*----- Predicated nested-loops join introduces predication. -----*/
4658 post_cond.add_or_replace_condition(m::Predicated(true));
4659 }
4660
4661 return post_cond;
4662}
4663
4664template<bool Predicated>
4665double NestedLoopsJoin<Predicated>::cost(const Match<NestedLoopsJoin> &M)
4666{
4667 double cost = 1;
4668 for (auto &child : M.children)
4669 cost *= child->get_matched_root().info().estimated_cardinality;
4670 return cost;
4671}
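/* Example: for estimated child cardinalities 1000 and 100, the cost estimate is their product
 * 100000, reflecting that nested loops enumerate the full cross product. */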
4672
4673template<bool Predicated>
4674void NestedLoopsJoin<Predicated>::execute(const Match<NestedLoopsJoin> &M, setup_t setup, pipeline_t pipeline,
4675 teardown_t teardown)
4676{
4677 const auto num_left_children = M.children.size() - 1; // all children but right-most one
4678
4679 std::vector<Schema> schemas; // to own adapted schemas
4680 schemas.reserve(num_left_children);
4681 std::vector<GlobalBuffer> buffers;
4682 buffers.reserve(num_left_children);
4683
4684 /*----- Process all but right-most child. -----*/
4685 for (std::size_t i = 0; i < num_left_children; ++i) {
4686 /*----- Create function for each child. -----*/
4687 FUNCTION(nested_loop_join_child_pipeline, void(void))
4688 {
4689 auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function
4690
4691 /*----- Create infinite buffer to materialize the current results. -----*/
4692 M_insist(bool(M.materializing_factories_[i]),
4693 "`wasm::NestedLoopsJoin` must have a factory for each materialized child");
4694 const auto &schema = schemas.emplace_back(
4695 M.children[i]->get_matched_root().schema().drop_constants().deduplicate()
4696 );
4697 if (i == 0) {
4698 /*----- Exactly one child (here the left-most one) checks the join predicate and resumes the pipeline. -----*/
4699 buffers.emplace_back(
4700 /* schema= */ schema,
4701 /* factory= */ *M.materializing_factories_[i],
4702 /* load_simdfied= */ false,
4703 /* num_tuples= */ 0, // i.e. infinite
4704 /* setup= */ setup_t::Make_Without_Parent(),
4705 /* pipeline= */ [&, pipeline=std::move(pipeline)](){
4706 if constexpr (Predicated) {
4707 CodeGenContext::Get().env().add_predicate(M.join.predicate());
4708 pipeline();
4709 } else {
4710 M_insist(CodeGenContext::Get().num_simd_lanes() == 1, "invalid number of SIMD lanes");
4711 IF (CodeGenContext::Get().env().compile<_Boolx1>(M.join.predicate()).is_true_and_not_null()) {
4712 pipeline();
4713 };
4714 }
4715 },
4716 /* teardown= */ teardown_t::Make_Without_Parent()
4717 );
4718 } else {
4719 /*----- All children but exactly one (here the left-most one) load the most recently inserted buffer again. -----*/
4720 /* All buffers are "connected" to each other by setting the pipeline callback to call the
4721 * `resume_pipeline_inline()` method of the most recently inserted buffer. Consequently, calling
4722 * `resume_pipeline_inline()` on the most recently inserted buffer loads one tuple from it, recursively
4723 * calls `resume_pipeline_inline()` on the buffer created before it, which again loads one tuple, and
4724 * so on, until the buffer inserted first (here the one of the left-most child) loads one of its
4725 * tuples and checks the join predicate for this one cartesian-product combination of result
4726 * tuples. */
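 /* For three children `R`, `S`, `T` (`R` left-most, `T` right-most): `T`'s pipeline resumes `S`'s
 * buffer, each loaded `S`-tuple resumes `R`'s buffer, and each loaded `R`-tuple checks the join
 * predicate, i.e. the chained buffers enumerate one combination of `R x S x T` at a time. */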
4727 buffers.emplace_back(
4728 /* schema= */ schema,
4729 /* factory= */ *M.materializing_factories_[i],
4730 /* load_simdfied= */ false,
4731 /* num_tuples= */ 0, // i.e. infinite
4732 /* setup= */ setup_t::Make_Without_Parent(),
4733 /* pipeline= */ [&](){ buffers.back().resume_pipeline_inline(); },
4734 /* teardown= */ teardown_t::Make_Without_Parent()
4735 );
4736 }
4737
4738 /*----- Materialize the current result tuple in pipeline. -----*/
4739 M.children[i]->execute(
4740 /* setup= */ setup_t::Make_Without_Parent([&](){ buffers.back().setup(); }),
4741 /* pipeline= */ [&](){ buffers.back().consume(); },
4742 /* teardown= */ teardown_t::Make_Without_Parent([&](){ buffers.back().teardown(); })
4743 );
4744 }
4745 nested_loop_join_child_pipeline(); // call child function
4746 }
4747
4748 /*----- Process right-most child. -----*/
4749 M.children.back()->execute(
4750 /* setup= */ std::move(setup),
4751 /* pipeline= */ [&](){ buffers.back().resume_pipeline_inline(); },
4752 /* teardown= */ std::move(teardown)
4753 );
4754}
4755
4756template<bool UniqueBuild, bool Predicated>
4757ConditionSet SimpleHashJoin<UniqueBuild, Predicated>::pre_condition(
4758 std::size_t,
4759 const std::tuple<const JoinOperator*, const Wildcard*, const Wildcard*> &partial_inner_nodes)
4760{
4761 ConditionSet pre_cond;
4762
4763 /*----- Simple hash join can only be used for binary joins on equi-predicates. -----*/
4764 auto &join = *std::get<0>(partial_inner_nodes);
4765 if (not join.predicate().is_equi())
4766 return ConditionSet::Make_Unsatisfiable();
4767
4768 if constexpr (UniqueBuild) {
4769 /*----- Decompose each clause of the join predicate of the form `A.x = B.y` into parts `A.x` and `B.y`. -----*/
4770 auto &build = *std::get<1>(partial_inner_nodes);
4771 for (auto &clause : join.predicate()) {
4772 M_insist(clause.size() == 1, "invalid equi-predicate");
4773 auto &literal = clause[0];
4774 auto &binary = as<const BinaryExpr>(literal.expr());
4775 M_insist((not literal.negative() and binary.tok == TK_EQUAL) or
4776 (literal.negative() and binary.tok == TK_BANG_EQUAL), "invalid equi-predicate");
4777 M_insist(is<const Designator>(binary.lhs), "invalid equi-predicate");
4778 M_insist(is<const Designator>(binary.rhs), "invalid equi-predicate");
4779 Schema::Identifier id_first(*binary.lhs), id_second(*binary.rhs);
4780 const auto &entry_build = build.schema().has(id_first) ? build.schema()[id_first].second
4781 : build.schema()[id_second].second;
4782
4783 /*----- Unique simple hash join can only be used on unique build key. -----*/
4784 if (not entry_build.unique())
4785 return ConditionSet::Make_Unsatisfiable();
4786 }
4787 }
4788
4789 /*----- Simple hash join does not support SIMD. -----*/
4790 pre_cond.add_condition(NoSIMD());
4791
4792 return pre_cond;
4793}
4794
4795template<bool UniqueBuild, bool Predicated>
4796ConditionSet SimpleHashJoin<UniqueBuild, Predicated>::post_condition(
4797 const Match<SimpleHashJoin>&,
4798 std::vector<std::reference_wrapper<const ConditionSet>> &&post_cond_children)
4799{
4800 M_insist(post_cond_children.size() == 2);
4801
4802 ConditionSet post_cond(post_cond_children[1].get()); // preserve conditions of right child
4803
4804 if constexpr (Predicated) {
4805 /*----- Predicated simple hash join introduces predication. -----*/
4806 post_cond.add_or_replace_condition(m::Predicated(true));
4807 } else {
4808 /*----- Branching simple hash join does not introduce predication (it is already handled by the hash table). -*/
4809 post_cond.add_or_replace_condition(m::Predicated(false));
4810 }
4811
4812 return post_cond;
4813}
4814
4815template<bool UniqueBuild, bool Predicated>
4816double SimpleHashJoin<UniqueBuild, Predicated>::cost(const Match<SimpleHashJoin> &M)
4817{
4819 return (M.build.id() == M.children[0]->get_matched_root().id() ? 1.0 : 2.0) + (UniqueBuild ? 0.0 : 0.1);
4821 return M.build.id() == M.children[1]->get_matched_root().id() ? 1.0 : 2.0 + (UniqueBuild ? 0.0 : 0.1);
4822 else
4823 return 1.5 * M.build.info().estimated_cardinality +
4824 (UniqueBuild ? 1.0 : 1.1) * M.probe.info().estimated_cardinality;
4825}
4826
4827template<bool UniqueBuild, bool Predicated>
4828void SimpleHashJoin<UniqueBuild, Predicated>::execute(const Match<SimpleHashJoin> &M, setup_t setup,
4829 pipeline_t pipeline, teardown_t teardown)
4830{
4831 // TODO: determine setup
4832 const uint64_t PAYLOAD_SIZE_THRESHOLD_IN_BITS =
4833 M.use_in_place_values ? std::numeric_limits<uint64_t>::max() : 0;
4834
4835 M_insist(((M.join.schema() | M.join.predicate().get_required()) & M.build.schema()) == M.build.schema());
4836 M_insist(M.build.schema().drop_constants() == M.build.schema());
4837 const auto ht_schema = M.build.schema().deduplicate();
4838
4839 /*----- Decompose each clause of the join predicate of the form `A.x = B.y` into parts `A.x` and `B.y`. -----*/
4840 const auto [build_keys, probe_keys] = decompose_equi_predicate(M.join.predicate(), ht_schema);
4841
4842 /*----- Compute payload IDs and its total size in bits (ignoring padding). -----*/
4843 std::vector<Schema::Identifier> payload_ids;
4844 uint64_t payload_size_in_bits = 0;
4845 for (auto &e : ht_schema) {
4846 if (not contains(build_keys, e.id)) {
4847 payload_ids.push_back(e.id);
4848 payload_size_in_bits += e.type->size();
4849 }
4850 }
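 /* Example: for `R JOIN S ON R.x = S.y` with hash table schema {R.x, R.z}, the build key is {R.x}
 * and the payload is {R.z}, i.e. every non-key entry of the hash table schema becomes payload. */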
4851
4852 /*----- Compute initial capacity of hash table. -----*/
4853 uint32_t initial_capacity = compute_initial_ht_capacity(M.build, M.load_factor);
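 /* Presumably sized s.t. the estimated build cardinality stays below the high watermark, i.e.
 * roughly the estimated cardinality divided by the load factor. */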
4854
4855 /*----- Create hash table for build child. -----*/
4856 std::unique_ptr<HashTable> ht;
4857 std::vector<HashTable::index_t> build_key_indices;
4858 for (auto &build_key : build_keys)
4859 build_key_indices.push_back(ht_schema[build_key].first);
4860 if (M.use_open_addressing_hashing) {
4861 if (payload_size_in_bits < PAYLOAD_SIZE_THRESHOLD_IN_BITS)
4862 ht = std::make_unique<GlobalOpenAddressingInPlaceHashTable>(ht_schema, std::move(build_key_indices),
4863 initial_capacity);
4864 else
4865 ht = std::make_unique<GlobalOpenAddressingOutOfPlaceHashTable>(ht_schema, std::move(build_key_indices),
4866 initial_capacity);
4867 if (M.use_quadratic_probing)
4868 as<OpenAddressingHashTableBase>(*ht).set_probing_strategy<QuadraticProbing>();
4869 else
4870 as<OpenAddressingHashTableBase>(*ht).set_probing_strategy<LinearProbing>();
4871 } else {
4872 ht = std::make_unique<GlobalChainedHashTable>(ht_schema, std::move(build_key_indices), initial_capacity);
4873 }
4874
4875 /*----- Create function for build child. -----*/
4876 FUNCTION(simple_hash_join_child_pipeline, void(void)) // create function for pipeline
4877 {
4878 auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function
4879
4880 M.children[0]->execute(
4881 /* setup= */ setup_t::Make_Without_Parent([&](){
4882 ht->setup();
4883 ht->set_high_watermark(M.load_factor);
4884 }),
4885 /* pipeline= */ [&](){
4886 auto &env = CodeGenContext::Get().env();
4887
4888 std::optional<Boolx1> build_key_not_null;
4889 for (auto &build_key : build_keys) {
4890 auto val = env.get(build_key);
4891 if (build_key_not_null)
4892 build_key_not_null.emplace(*build_key_not_null and not_null(val));
4893 else
4894 build_key_not_null.emplace(not_null(val));
4895 }
4896 M_insist(bool(build_key_not_null));
4897 IF (*build_key_not_null) { // TODO: predicated version
4898 /*----- Insert key. -----*/
4899 std::vector<SQL_t> key;
4900 for (auto &build_key : build_keys)
4901 key.emplace_back(env.get(build_key));
4902 auto entry = ht->emplace(std::move(key));
4903
4904 /*----- Insert payload. -----*/
4905 for (auto &id : payload_ids) {
4906 std::visit(overloaded {
4907 [&]<sql_type T>(HashTable::reference_t<T> &&r) -> void { r = env.extract<T>(id); },
4908 [](std::monostate) -> void { M_unreachable("invalid reference"); },
4909 }, entry.extract(id));
4910 }
4911 };
4912 },
4913 /* teardown= */ teardown_t::Make_Without_Parent([&](){ ht->teardown(); })
4914 );
4915 }
4916 simple_hash_join_child_pipeline(); // call child function
4917
4918 M.children[1]->execute(
4919 /* setup= */ setup_t(std::move(setup), [&](){ ht->setup(); }),
4920 /* pipeline= */ [&, pipeline=std::move(pipeline)](){
4921 auto &env = CodeGenContext::Get().env();
4922
4923 auto emit_tuple_and_resume_pipeline = [&, pipeline=std::move(pipeline)](HashTable::const_entry_t entry){
4924 /*----- Add found entry from hash table, i.e. from build child, to current environment. -----*/
4925 for (auto &e : ht_schema) {
4926 if (not entry.has(e.id)) { // entry may not contain build key in case `ht->find()` was used
4927 M_insist(contains(build_keys, e.id));
4928 M_insist(env.has(e.id), "build key must already be contained in the current environment");
4929 continue;
4930 }
4931
4932 std::visit(overloaded {
4933 [&]<typename T>(HashTable::const_reference_t<Expr<T>> &&r) -> void {
4934 Expr<T> value = r;
4935 if (value.can_be_null()) {
4936 Var<Expr<T>> var(value); // introduce variable s.t. uses only load from it
4937 env.add(e.id, var);
4938 } else {
4939 /* introduce variable w/o NULL bit s.t. uses only load from it */
4940 Var<PrimitiveExpr<T>> var(value.insist_not_null());
4941 env.add(e.id, Expr<T>(var));
4942 }
4943 },
4944 [&](HashTable::const_reference_t<NChar> &&r) -> void {
4945 NChar value(r);
4946 Var<Ptr<Charx1>> var(value.val()); // introduce variable s.t. uses only load from it
4947 env.add(e.id, NChar(var, value.can_be_null(), value.length(),
4948 value.guarantees_terminating_nul()));
4949 },
4950 [](std::monostate) -> void { M_unreachable("invalid reference"); },
4951 }, entry.extract(e.id));
4952 }
4953
4954 /*----- Resume pipeline. -----*/
4955 pipeline();
4956 };
4957
4958 /* TODO: may check for NULL on probe keys as well, branching + predicated version */
4959 /*----- Probe with probe key. -----*/
4960 std::vector<SQL_t> key;
4961 for (auto &probe_key : probe_keys)
4962 key.emplace_back(env.get(probe_key));
4963 if constexpr (UniqueBuild) {
4964 /*----- Add build key to current environment since `ht->find()` will only return the payload values. -----*/
4965 for (auto build_it = build_keys.cbegin(), probe_it = probe_keys.cbegin(); build_it != build_keys.cend();
4966 ++build_it, ++probe_it)
4967 {
4968 M_insist(probe_it != probe_keys.cend());
4969 if (not env.has(*build_it)) // skip duplicated build keys and only add first occurrence
4970 env.add(*build_it, env.get(*probe_it)); // since build and probe keys match for join partners
4971 }
4972
4973 /*----- Try to find the *single* possible join partner. -----*/
4974 auto p = ht->find(std::move(key));
4975 auto &entry = p.first;
4976 auto &found = p.second;
4977 if constexpr (Predicated) {
4978 env.add_predicate(found);
4979 emit_tuple_and_resume_pipeline(std::move(entry));
4980 } else {
4981 IF (found) {
4982 emit_tuple_and_resume_pipeline(std::move(entry));
4983 };
4984 }
4985 } else {
4986 /*----- Search for *all* join partners. -----*/
4987 ht->for_each_in_equal_range(std::move(key), std::move(emit_tuple_and_resume_pipeline), Predicated);
4988 }
4989 },
4990 /* teardown= */ teardown_t(std::move(teardown), [&](){ ht->teardown(); })
4991 );
4992}
4993
4994template<bool SortLeft, bool SortRight, bool Predicated, bool CmpPredicated>
4995ConditionSet SortMergeJoin<SortLeft, SortRight, Predicated, CmpPredicated>::pre_condition(
4996 std::size_t child_idx,
4997 const std::tuple<const JoinOperator*, const Wildcard*, const Wildcard*> &partial_inner_nodes)
4998{
4999 ConditionSet pre_cond;
5000
5001 /*----- Sort merge join can only be used for binary joins on conjunctions of equi-predicates. -----*/
5002 auto &join = *std::get<0>(partial_inner_nodes);
5003 if (not join.predicate().is_equi())
5004 return ConditionSet::Make_Unsatisfiable();
5005
5006 /*----- Decompose each clause of the join predicate of the form `A.x = B.y` into parts `A.x` and `B.y`. -----*/
5007 auto parent = std::get<1>(partial_inner_nodes);
5008 auto child = std::get<2>(partial_inner_nodes);
5009 M_insist(parent);
5010 M_insist(child_idx != 1 or child);
5011 std::vector<Schema::Identifier> keys_parent, keys_child;
5012 for (auto &clause : join.predicate()) {
5013 M_insist(clause.size() == 1, "invalid equi-predicate");
5014 auto &literal = clause[0];
5015 auto &binary = as<const BinaryExpr>(literal.expr());
5016 M_insist((not literal.negative() and binary.tok == TK_EQUAL) or
5017 (literal.negative() and binary.tok == TK_BANG_EQUAL), "invalid equi-predicate");
5018 M_insist(is<const Designator>(binary.lhs), "invalid equi-predicate");
5019 M_insist(is<const Designator>(binary.rhs), "invalid equi-predicate");
5020 Schema::Identifier id_first(*binary.lhs), id_second(*binary.rhs);
5021 Schema::entry_type dummy;
5022 const auto &[entry_parent, entry_child] = parent->schema().has(id_first)
5023 ? std::make_pair(parent->schema()[id_first].second, child_idx == 1 ? child->schema()[id_second].second : std::move(dummy))
5024 : std::make_pair(parent->schema()[id_second].second, child_idx == 1 ? child->schema()[id_first].second : std::move(dummy));
5025 keys_parent.push_back(entry_parent.id);
5026 keys_child.push_back(entry_child.id);
5027
5028 /*----- Sort merge join can only be used on unique parent key. -----*/
5029 if (not entry_parent.unique())
5030 return ConditionSet::Make_Unsatisfiable();
5031 }
5032 M_insist(keys_parent.size() == keys_child.size(), "number of found IDs differ");
5033 M_insist(not keys_parent.empty(), "must find at least one ID");
5034
5035 if constexpr (not SortLeft or not SortRight) {
5036 /*----- Sort merge join without sorting needs its data sorted on the respective key. -----*/
5037 Sortedness::order_t orders;
5038 M_insist(child_idx < 2);
5039 if (not SortLeft and child_idx == 0) {
5040 for (auto &key_parent : keys_parent) {
5041 if (orders.find(key_parent) == orders.cend())
5042 orders.add(key_parent, Sortedness::O_ASC); // TODO: support different order
5043 }
5044 } else if (not SortRight and child_idx == 1) {
5045 for (auto &key_child : keys_child) {
5046 if (orders.find(key_child) == orders.cend())
5047 orders.add(key_child, Sortedness::O_ASC); // TODO: support different order
5048 }
5049 }
5050 pre_cond.add_condition(Sortedness(std::move(orders)));
5051 }
5052
5053 /*----- Sort merge join does not support SIMD. -----*/
5054 pre_cond.add_condition(NoSIMD());
5055
5056 return pre_cond;
5057}
5058
5059template<bool SortLeft, bool SortRight, bool Predicated, bool CmpPredicated>
5060ConditionSet SortMergeJoin<SortLeft, SortRight, Predicated, CmpPredicated>::post_condition(
5061 const Match<SortMergeJoin> &M,
5062 std::vector<std::reference_wrapper<const ConditionSet>> &&post_cond_children)
5063{
5064 M_insist(post_cond_children.size() == 2);
5065
5066 ConditionSet post_cond;
5067
5068 if constexpr (Predicated) {
5069 /*----- Predicated sort merge join introduces predication. -----*/
5070 post_cond.add_or_replace_condition(m::Predicated(true));
5071 }
5072
5073 /*----- Sort merge join does not introduce SIMD. -----*/
5074 post_cond.add_condition(NoSIMD());
5075
5076 Sortedness::order_t orders;
5077 if constexpr (not SortLeft) {
5078 Sortedness sorting_left(post_cond_children[0].get().get_condition<Sortedness>());
5079 orders.merge(sorting_left.orders()); // preserve sortedness of left child (including order)
5080 }
5081 if constexpr (not SortRight) {
5082 Sortedness sorting_right(post_cond_children[1].get().get_condition<Sortedness>());
5083 orders.merge(sorting_right.orders()); // preserve sortedness of right child (including order)
5084 }
5085 if constexpr (SortLeft or SortRight) {
5086 /*----- Decompose each clause of the join predicate of the form `A.x = B.y` into parts `A.x` and `B.y`. -----*/
5087 auto [keys_parent, keys_child] = decompose_equi_predicate(M.join.predicate(), M.parent.schema());
5088
5089 /*----- Sort merge join does sort the data on the respective key. -----*/
5090 if constexpr (SortLeft) {
5091 for (auto &key_parent : keys_parent) {
5092 if (orders.find(key_parent) == orders.cend())
5093 orders.add(key_parent, Sortedness::O_ASC); // add sortedness for left child
5094 }
5095 }
5096 if constexpr (SortRight) {
5097 for (auto &key_child : keys_child) {
5098 if (orders.find(key_child) == orders.cend())
5099 orders.add(key_child, Sortedness::O_ASC); // add sortedness for right child
5100 }
5101 }
5102 }
5103 post_cond.add_condition(Sortedness(std::move(orders)));
5104
5105 return post_cond;
5106}
5107
5108template<bool SortLeft, bool SortRight, bool Predicated, bool CmpPredicated>
5109double SortMergeJoin<SortLeft, SortRight, Predicated, CmpPredicated>::cost(const Match<SortMergeJoin> &M)
5110{
5111 const double card_left = M.parent.info().estimated_cardinality;
5112 const double card_right = M.child.info().estimated_cardinality;
5113
5114 double cost = card_left + card_right; // cost for merge
5115 if constexpr (SortLeft)
5116 cost += std::log2(card_left) * card_left; // cost for sort left
5117 if constexpr (SortRight)
5118 cost += std::log2(card_right) * card_right; // cost for sort right
5119
5120 return cost;
5121}
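/* Example: with card_left = card_right = 1024 and both sides requiring a sort, the estimate is
 * 2 * (1024 * log2(1024)) + (1024 + 1024) = 20480 + 2048 = 22528; the n log n sort terms dominate
 * the linear merge cost. */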
5122
5123template<bool SortLeft, bool SortRight, bool Predicated, bool CmpPredicated>
5124void SortMergeJoin<SortLeft, SortRight, Predicated, CmpPredicated>::execute(
5125 const Match<SortMergeJoin> &M,
5126 setup_t setup,
5127 pipeline_t pipeline,
5128 teardown_t teardown)
5129{
5130 auto &env = CodeGenContext::Get().env();
5131 const bool needs_buffer_parent = not is<const ScanOperator>(M.parent) or SortLeft;
5132 const bool needs_buffer_child = not is<const ScanOperator>(M.child) or SortRight;
5133
5134 /*----- Create infinite buffers to materialize the current results (if necessary). -----*/
5135 M_insist(bool(M.left_materializing_factory),
5136 "`wasm::SortMergeJoin` must have a factory for the materialized left child");
5137 M_insist(bool(M.right_materializing_factory),
5138 "`wasm::SortMergeJoin` must have a factory for the materialized right child");
5139 const auto schema_parent = M.parent.schema().drop_constants().deduplicate();
5140 const auto schema_child = M.child.schema().drop_constants().deduplicate();
5141 std::optional<GlobalBuffer> buffer_parent, buffer_child;
5142 if (needs_buffer_parent)
5143 buffer_parent.emplace(schema_parent, *M.left_materializing_factory);
5144 if (needs_buffer_child)
5145 buffer_child.emplace(schema_child, *M.right_materializing_factory);
5146
5147 /*----- Create child functions. -----*/
5148 if (needs_buffer_parent) {
5149 FUNCTION(sort_merge_join_parent_pipeline, void(void)) // create function for parent pipeline
5150 {
5151 auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function
5152 M.children[0]->execute(
5153 /* setup= */ setup_t::Make_Without_Parent([&](){ buffer_parent->setup(); }),
5154 /* pipeline= */ [&](){ buffer_parent->consume(); },
5155 /* teardown= */ teardown_t::Make_Without_Parent([&](){ buffer_parent->teardown(); })
5156 );
5157 }
5158 sort_merge_join_parent_pipeline(); // call parent function
5159 }
5160 if (needs_buffer_child) {
5161 FUNCTION(sort_merge_join_child_pipeline, void(void)) // create function for child pipeline
5162 {
5163 auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function
5164 M.children[1]->execute(
5165 /* setup= */ setup_t::Make_Without_Parent([&](){ buffer_child->setup(); }),
5166 /* pipeline= */ [&](){ buffer_child->consume(); },
5167 /* teardown= */ teardown_t::Make_Without_Parent([&](){ buffer_child->teardown(); })
5168 );
5169 }
5170 sort_merge_join_child_pipeline(); // call child function
5171 }
5172
5173 /*----- Decompose each clause of the join predicate of the form `A.x = B.y` into parts `A.x` and `B.y`. -----*/
5174 std::vector<SortingOperator::order_type> order_parent, order_child;
5175 for (auto &clause : M.join.predicate()) {
5176 M_insist(clause.size() == 1, "invalid equi-predicate");
5177 auto &literal = clause[0];
5178 auto &binary = as<const BinaryExpr>(literal.expr());
5179 M_insist((not literal.negative() and binary.tok == TK_EQUAL) or
5180 (literal.negative() and binary.tok == TK_BANG_EQUAL), "invalid equi-predicate");
5181 M_insist(is<const Designator>(binary.lhs), "invalid equi-predicate");
5182 M_insist(is<const Designator>(binary.rhs), "invalid equi-predicate");
5183 auto [expr_parent, expr_child] = M.parent.schema().has(Schema::Identifier(*binary.lhs)) ?
5184 std::make_pair(binary.lhs.get(), binary.rhs.get()) : std::make_pair(binary.rhs.get(), binary.lhs.get());
5185 order_parent.emplace_back(*expr_parent, true); // ascending order
5186 order_child.emplace_back(*expr_child, true); // ascending order
5187 }
5188 M_insist(order_parent.size() == order_child.size(), "number of found IDs differ");
5189 M_insist(not order_parent.empty(), "must find at least one ID");
5190
5191 /*----- If necessary, invoke sorting algorithm with buffer to sort. -----*/
5192 if constexpr (SortLeft)
5193 quicksort<CmpPredicated>(*buffer_parent, order_parent);
5194 if constexpr (SortRight)
5195 quicksort<CmpPredicated>(*buffer_child, order_child);
5196
5197 /*----- Create predicate to check whether the child co-group is smaller than or equal to that of the parent relation. -----*/
5198 auto child_smaller_equal = [&]() -> Boolx1 {
5199 std::optional<Boolx1> child_smaller_equal_;
5200 for (std::size_t i = 0; i < order_child.size(); ++i) {
5201 auto &des_parent = as<const Designator>(order_parent[i].first);
5202 auto &des_child = as<const Designator>(order_child[i].first);
5203 Token leq = Token::CreateArtificial(TK_LESS_EQUAL);
5204 auto cpy_parent = std::make_unique<Designator>(des_parent.tok, des_parent.table_name, des_parent.attr_name,
5205 des_parent.type(), des_parent.target());
5206 auto cpy_child = std::make_unique<Designator>(des_child.tok, des_child.table_name, des_child.attr_name,
5207 des_child.type(), des_child.target());
5208 BinaryExpr expr(std::move(leq), std::move(cpy_child), std::move(cpy_parent));
5209
5210 auto child = env.get(Schema::Identifier(des_child));
5211 Boolx1 cmp = env.compile<_Boolx1>(expr).is_true_and_not_null();
5212 if (child_smaller_equal_)
5213 child_smaller_equal_.emplace(*child_smaller_equal_ and (is_null(child) or cmp));
5214 else
5215 child_smaller_equal_.emplace(is_null(child) or cmp);
5216 }
5217 M_insist(bool(child_smaller_equal_));
5218 return *child_smaller_equal_;
5219 };
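 /* A NULL child key is treated as smaller-or-equal (`is_null(child) or cmp`), so the merge
 * advances the child side past NULL keys, which cannot find join partners under an
 * equi-predicate anyway. */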
5220
5221 /*----- Compile data layouts to generate sequential loads from buffers. -----*/
5222 static Schema empty_schema;
5223 Var<U32x1> tuple_id_parent, tuple_id_child; // default initialized to 0
5224 auto [inits_parent, loads_parent, _jumps_parent] = [&](){
5225 if (needs_buffer_parent) {
5226 return compile_load_sequential(buffer_parent->schema(), empty_schema, buffer_parent->base_address(),
5227 buffer_parent->layout(), 1, buffer_parent->schema(), tuple_id_parent);
5228 } else {
5229 auto &scan = as<const ScanOperator>(M.parent);
5230 return compile_load_sequential(schema_parent, empty_schema, get_base_address(scan.store().table().name()),
5231 scan.store().table().layout(), 1, scan.store().table().schema(scan.alias()),
5232 tuple_id_parent);
5233 }
5234 }();
5235 auto [inits_child, loads_child, _jumps_child] = [&](){
5236 if (needs_buffer_child) {
5237 return compile_load_sequential(buffer_child->schema(), empty_schema, buffer_child->base_address(),
5238 buffer_child->layout(), 1, buffer_child->schema(), tuple_id_child);
5239 } else {
5240 auto &scan = as<const ScanOperator>(M.child);
5241 return compile_load_sequential(schema_child, empty_schema, get_base_address(scan.store().table().name()),
5242 scan.store().table().layout(), 1, scan.store().table().schema(scan.alias()),
5243 tuple_id_child);
5244 }
5245 }();
5246 /* since structured bindings cannot be used in lambda capture */
5247 Block jumps_parent(std::move(_jumps_parent)), jumps_child(std::move(_jumps_child));
5248
5249 /*----- Process both buffers together. -----*/
5250 setup();
5251 inits_parent.attach_to_current();
5252 inits_child.attach_to_current();
5253 U32x1 size_parent = needs_buffer_parent ? buffer_parent->size()
5254 : get_num_rows(as<const ScanOperator>(M.parent).store().table().name());
5255 U32x1 size_child = needs_buffer_child ? buffer_child->size()
5256 : get_num_rows(as<const ScanOperator>(M.child).store().table().name());
5257 WHILE (tuple_id_parent < size_parent and tuple_id_child < size_child) { // neither end reached
5258 loads_parent.attach_to_current();
5259 loads_child.attach_to_current();
5260 if constexpr (Predicated) {
5261 env.add_predicate(M.join.predicate());
5262 pipeline();
5263 } else {
5264 M_insist(CodeGenContext::Get().num_simd_lanes() == 1, "invalid number of SIMD lanes");
5265 IF (env.compile<_Boolx1>(M.join.predicate()).is_true_and_not_null()) { // predicate fulfilled
5266 pipeline();
5267 };
5268 }
5269 IF (child_smaller_equal()) {
5270 jumps_child.attach_to_current();
5271 } ELSE {
5272 jumps_parent.attach_to_current();
5273 };
5274 }
5275 teardown();
5276}
5277
5278
5279/*======================================================================================================================
5280 * Limit
5281 *====================================================================================================================*/
5282
5283ConditionSet Limit::pre_condition(std::size_t child_idx, const std::tuple<const LimitOperator*>&)
5284{
5285 M_insist(child_idx == 0);
5286
5287 ConditionSet pre_cond;
5288
5289 /*----- Limit does not support SIMD. -----*/
5290 pre_cond.add_condition(NoSIMD());
5291
5292 return pre_cond;
5293}
5294
5295void Limit::execute(const Match<Limit> &M, setup_t setup, pipeline_t pipeline, teardown_t teardown)
5296{
5297 std::optional<Block> teardown_block;
5298 std::optional<BlockUser> use_teardown;
5299
5300 std::optional<Var<U32x1>> counter;
5301 /* default initialized to 0 */
5302 Global<U32x1> counter_backup;
5303
5304 M.child->execute(
5305 /* setup= */ setup_t(std::move(setup), [&](){
5306 counter.emplace(counter_backup);
5307 teardown_block.emplace("limit.teardown", true); // create block
5308 use_teardown.emplace(*teardown_block); // set block active s.t. it contains all following pipeline code
5309 }),
5310 /* pipeline= */ [&, pipeline=std::move(pipeline)](){
5311 M_insist(bool(teardown_block));
5312 M_insist(bool(counter));
5313 const uint32_t limit = M.limit.offset() + M.limit.limit();
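 /* E.g. `LIMIT 10 OFFSET 5` yields limit = 15: tuples with counter in [5, 15) are emitted, and
 * the pipeline jumps to the teardown block once the counter reaches 15. */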
5314
5315 /*----- Abort pipeline, i.e. go to teardown code, if limit is exceeded. -----*/
5316 IF (*counter >= limit) {
5317 GOTO(*teardown_block);
5318 };
5319
5320 /*----- Emit result if in bounds. -----*/
5321 if (M.limit.offset()) {
5322 IF (*counter >= uint32_t(M.limit.offset())) {
5323 Wasm_insist(*counter < limit, "counter must not exceed limit");
5324 pipeline();
5325 };
5326 } else {
5327 Wasm_insist(*counter < limit, "counter must not exceed limit");
5328 pipeline();
5329 }
5330
5331 /*----- Update counter. -----*/
5332 *counter += 1U;
5333 },
5334 /* teardown= */ teardown_t::Make_Without_Parent([&, teardown=std::move(teardown)](){
5335 M_insist(bool(teardown_block));
5336 M_insist(bool(use_teardown));
5337 use_teardown.reset(); // deactivate block
5338 teardown_block.reset(); // emit block containing pipeline code into parent -> GOTO jumps here
5339 teardown(); // *before* own teardown code to *not* jump over it in case of another limit operator
5340 M_insist(bool(counter));
5341 counter_backup = *counter;
5342 counter.reset();
5343 })
5344 );
5345}
5346
5347
5348/*======================================================================================================================
5349 * Grouping combined with Join
5350 *====================================================================================================================*/
5351
5352ConditionSet HashBasedGroupJoin::pre_condition(
5353 std::size_t child_idx,
5354 const std::tuple<const GroupingOperator*, const JoinOperator*, const Wildcard*, const Wildcard*>
5355 &partial_inner_nodes)
5356{
5357 ConditionSet pre_cond;
5358
5359 /*----- Hash-based group-join can only be used if aggregates only depend on either build or probe relation. -----*/
5360 auto &grouping = *std::get<0>(partial_inner_nodes);
5361 for (auto &fn_expr : grouping.aggregates()) {
5362 M_insist(fn_expr.get().args.size() <= 1);
5363 if (fn_expr.get().args.size() == 1 and not is<const Designator>(fn_expr.get().args[0])) // XXX: an expression with only designators from either child would also be valid
5364 return ConditionSet::Make_Unsatisfiable();
5365 }
5366
5367 /*----- Hash-based group-join can only be used for binary joins on equi-predicates. -----*/
5368 auto &join = *std::get<1>(partial_inner_nodes);
5369 if (not join.predicate().is_equi())
5370 return ConditionSet::Make_Unsatisfiable();
5371
5372 M_insist(child_idx < 2);
5373 if (child_idx == 0) {
5374 /*----- Decompose each clause of the join predicate of the form `A.x = B.y` into parts `A.x` and `B.y`. -----*/
5375 auto &build = *std::get<2>(partial_inner_nodes);
5376 const auto build_keys = decompose_equi_predicate(join.predicate(), build.schema()).first;
5377
5378 /*----- Hash-based group-join can only be used if grouping and join (i.e. build) key match (ignoring order). -*/
5379 const auto num_grouping_keys = grouping.group_by().size();
5380 if (num_grouping_keys != build_keys.size()) // XXX: duplicated IDs are still a match but rejected here
5381 return ConditionSet::Make_Unsatisfiable();
5382 for (std::size_t i = 0; i < num_grouping_keys; ++i) {
5383 Schema::Identifier grouping_key(grouping.group_by()[i].first.get());
5384 if (not contains(build_keys, grouping_key))
5385 return ConditionSet::Make_Unsatisfiable();
5386 }
5387 }
5388
5389 /*----- Hash-based group-join does not support SIMD. -----*/
5390 pre_cond.add_condition(NoSIMD());
5391
5392 return pre_cond;
5393}
5394
5395double HashBasedGroupJoin::cost(const Match<HashBasedGroupJoin> &M)
5396{
5397 return 1.5 * M.build.info().estimated_cardinality + 1.0 * M.probe.info().estimated_cardinality +
5398 1.0 * M.join.info().estimated_cardinality;
5399}
5400
5401ConditionSet HashBasedGroupJoin::post_condition(const Match<HashBasedGroupJoin>&)
5402{
5403 ConditionSet post_cond;
5404
5405 /*----- Hash-based group-join does not introduce predication (it is already handled by the hash table). -----*/
5406 post_cond.add_condition(Predicated(false));
5407
5408 /*----- Hash-based group-join does not introduce SIMD. -----*/
5409 post_cond.add_condition(NoSIMD());
5410
5411 return post_cond;
5412}
5413
5414void HashBasedGroupJoin::execute(const Match<HashBasedGroupJoin> &M, setup_t setup, pipeline_t pipeline,
5415 teardown_t teardown)
5416{
5417 // TODO: determine setup
5418 const uint64_t AGGREGATES_SIZE_THRESHOLD_IN_BITS =
5419 M.use_in_place_values ? std::numeric_limits<uint64_t>::max() : 0;
5420
5421 auto &C = Catalog::Get();
5422 const auto num_keys = M.grouping.group_by().size();
5423
5424 /*----- Compute hash table schema and information about aggregates, especially AVG aggregates. -----*/
5425 Schema ht_schema;
5426 for (std::size_t i = 0; i < num_keys; ++i) {
5427 auto &e = M.grouping.schema()[i];
5428 ht_schema.add(e.id, e.type, e.constraints);
5429 }
5430 auto aggregates_info = compute_aggregate_info(M.grouping.aggregates(), M.grouping.schema(), num_keys);
5431 const auto &aggregates = aggregates_info.first;
5432 const auto &avg_aggregates = aggregates_info.second;
5433 bool needs_build_counter = false;
5434 uint64_t aggregates_size_in_bits = 0;
5435 for (auto &info : aggregates) {
5436 ht_schema.add(info.entry);
5437 aggregates_size_in_bits += info.entry.type->size();
5438
5439 /* Add an additional COUNT per group during the build phase if a COUNT or SUM depending on the probe relation occurs. */
5440 if (info.fnid == m::Function::FN_COUNT or info.fnid == m::Function::FN_SUM) {
5441 if (not info.args.empty()) {
5442 M_insist(info.args.size() == 1, "aggregate functions expect at most one argument");
5443 auto &des = as<const Designator>(*info.args[0]);
5444 Schema::Identifier arg(des.table_name.text, des.attr_name.text.assert_not_none());
5445 if (M.probe.schema().has(arg))
5446 needs_build_counter = true;
5447 }
5448 }
5449 }
5450 if (needs_build_counter) {
5451 ht_schema.add(Schema::Identifier(C.pool("$build_counter")), Type::Get_Integer(Type::TY_Scalar, 8),
5452 Schema::entry_type::NOT_NULLABLE);
5453 aggregates_size_in_bits += 64;
5454 }
5455 ht_schema.add(Schema::Identifier(C.pool("$probe_counter")), Type::Get_Integer(Type::TY_Scalar, 8),
5456 Schema::entry_type::NOT_NULLABLE);
5457 aggregates_size_in_bits += 64;
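 /* These internal counters allow finalizing the aggregates after both phases: a group joining
 * with n probe tuples repeats each build tuple n times, so e.g. a COUNT(*) computed during the
 * build phase is later multiplied by `$probe_counter`, and probe-side COUNTs and SUMs by
 * `$build_counter`. */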
5458
5459 /*----- Decompose each clause of the join predicate of the form `A.x = B.y` into parts `A.x` and `B.y`. -----*/
5460 const auto [build_keys, probe_keys] = decompose_equi_predicate(M.join.predicate(), M.build.schema());
5461 M_insist(build_keys.size() == num_keys);
5462
5463 /*----- Compute initial capacity of hash table. -----*/
5464 uint32_t initial_capacity = compute_initial_ht_capacity(M.grouping, M.load_factor);
5465
5466 /*----- Create hash table for build relation. -----*/
5467 std::unique_ptr<HashTable> ht;
5468 std::vector<HashTable::index_t> key_indices(num_keys);
5469 std::iota(key_indices.begin(), key_indices.end(), 0);
5470 if (M.use_open_addressing_hashing) {
5471 if (aggregates_size_in_bits < AGGREGATES_SIZE_THRESHOLD_IN_BITS)
5472 ht = std::make_unique<GlobalOpenAddressingInPlaceHashTable>(ht_schema, std::move(key_indices),
5473 initial_capacity);
5474 else
5475 ht = std::make_unique<GlobalOpenAddressingOutOfPlaceHashTable>(ht_schema, std::move(key_indices),
5476 initial_capacity);
5477 if (M.use_quadratic_probing)
5478 as<OpenAddressingHashTableBase>(*ht).set_probing_strategy<QuadraticProbing>();
5479 else
5480 as<OpenAddressingHashTableBase>(*ht).set_probing_strategy<LinearProbing>();
5481 } else {
5482 ht = std::make_unique<GlobalChainedHashTable>(ht_schema, std::move(key_indices), initial_capacity);
5483 }
5484
5485 std::optional<HashTable::entry_t> dummy;
5486
 /*----- Create helper to compile the aggregate computations for both phases. -----*/
 /* Compiles, for each aggregate, the code to initialize it for a newly inserted group and the code
 * to update it for an existing group. Three separate blocks are returned: one for initialization,
 * one for the updates of all aggregates except AVG, and one for the AVG updates, which must run
 * after the respective running counts were updated. Arguments not contained in `schema` are
 * unbound in the current phase (build vs. probe, see `build_phase`) and leave the aggregate
 * unchanged. */
5493 auto compile_aggregates = [&](HashTable::entry_t &entry, const Environment &env, const Schema &schema,
5494 bool build_phase) -> std::tuple<Block, Block, Block>
5495 {
5496 Block init_aggs("hash_based_group_join.init_aggs", false),
5497 update_aggs("hash_based_group_join.update_aggs", false),
5498 update_avg_aggs("hash_based_group_join.update_avg_aggs", false);
5499 for (auto &info : aggregates) {
5500 bool is_min = false;
5501 switch (info.fnid) {
5502 default:
5503 M_unreachable("unsupported aggregate function");
5504 case m::Function::FN_MIN:
5505 is_min = true; // set flag and delegate to MAX case
5506 case m::Function::FN_MAX: {
5507 M_insist(info.args.size() == 1, "MIN and MAX aggregate functions expect exactly one argument");
5508 auto &arg = as<const Designator>(*info.args[0]);
5509 const bool bound = schema.has(Schema::Identifier(arg.table_name.text,
5510 arg.attr_name.text.assert_not_none()));
5511
5512 std::visit(overloaded {
5513 [&]<sql_type _T>(HashTable::reference_t<_T> &&r) -> void
5514 requires (not (std::same_as<_T, _Boolx1> or std::same_as<_T, NChar>)) {
5515 using type = typename _T::type;
5516 using T = PrimitiveExpr<type>;
5517
5518 if (build_phase) {
5519 BLOCK_OPEN(init_aggs) {
5520 auto neutral = is_min ? T(std::numeric_limits<type>::max())
5521 : T(std::numeric_limits<type>::lowest());
5522 if (bound) {
5523 auto _arg = env.compile(arg);
5524 auto [val_, is_null] = convert<_T>(_arg).split();
5525 T val(val_); // due to structured binding and lambda closure
5526 IF (is_null) {
5527 r.clone().set_value(neutral); // initialize with neutral element +inf or -inf
5528 if (info.entry.nullable())
5529 r.clone().set_null_bit(Boolx1(true)); // first value is NULL
5530 } ELSE {
5531 r.clone().set_value(val); // initialize with first value
5532 if (info.entry.nullable())
5533 r.clone().set_null_bit(Boolx1(false)); // first value is not NULL
5534 };
5535 } else {
5536 r.clone().set_value(neutral); // initialize with neutral element +inf or -inf
5537 if (info.entry.nullable())
5538 r.clone().set_null_bit(Boolx1(true)); // initialize with neutral element NULL
5539 }
5540 }
5541 }
5542 if (not bound) {
5543 r.discard();
5544 return; // MIN and MAX do not change in a phase where the argument is unbound
5545 }
5546 BLOCK_OPEN(update_aggs) {
5547 auto _arg = env.compile(arg);
5548 _T _new_val = convert<_T>(_arg);
5549 if (_new_val.can_be_null()) {
5550 auto [new_val_, new_val_is_null_] = _new_val.split();
5551 auto [old_min_max_, old_min_max_is_null] = _T(r.clone()).split();
5552 const Var<Boolx1> new_val_is_null(new_val_is_null_); // due to multiple uses
5553
5554 auto chosen_r = Select(new_val_is_null, dummy->extract<_T>(info.entry.id), r.clone());
5555 if constexpr (std::floating_point<type>) {
5556 chosen_r.set_value(
5557 is_min ? min(old_min_max_, new_val_) // update old min with new value
5558 : max(old_min_max_, new_val_) // update old max with new value
5559 ); // if new value is NULL, only dummy is written
5560 } else {
5561 const Var<T> new_val(new_val_),
5562 old_min_max(old_min_max_); // due to multiple uses
5563 auto cmp = is_min ? new_val < old_min_max : new_val > old_min_max;
5564 chosen_r.set_value(
5565 Select(cmp,
5566 new_val, // update to new value
5567 old_min_max) // do not update
5568 ); // if new value is NULL, only dummy is written
5569 }
5570 r.set_null_bit(
5571 old_min_max_is_null and new_val_is_null // MIN/MAX is NULL iff all values are NULL
5572 );
5573 } else {
5574 auto new_val_ = _new_val.insist_not_null();
5575 auto old_min_max_ = _T(r.clone()).insist_not_null();
5576 if constexpr (std::floating_point<type>) {
5577 r.set_value(
5578 is_min ? min(old_min_max_, new_val_) // update old min with new value
5579 : max(old_min_max_, new_val_) // update old max with new value
5580 );
5581 } else {
5582 const Var<T> new_val(new_val_),
5583 old_min_max(old_min_max_); // due to multiple uses
5584 auto cmp = is_min ? new_val < old_min_max : new_val > old_min_max;
5585 r.set_value(
5586 Select(cmp,
5587 new_val, // update to new value
5588 old_min_max) // do not update
5589 );
5590 }
5591 /* do not update NULL bit since it is already set to `false` */
5592 }
5593 }
5594 },
5595 []<sql_type _T>(HashTable::reference_t<_T>&&) -> void
5596 requires std::same_as<_T, _Boolx1> or std::same_as<_T, NChar> {
5597 M_unreachable("invalid type");
5598 },
5599 [](std::monostate) -> void { M_unreachable("invalid reference"); },
5600 }, entry.extract(info.entry.id));
5601 break;
5602 }
5603 case m::Function::FN_AVG: {
5604 auto it = avg_aggregates.find(info.entry.id);
5605 M_insist(it != avg_aggregates.end());
5606 const auto &avg_info = it->second;
5607 M_insist(avg_info.compute_running_avg,
5608 "AVG aggregate may only occur for running average computations");
5609 M_insist(info.args.size() == 1, "AVG aggregate function expects exactly one argument");
5610 auto &arg = as<const Designator>(*info.args[0]);
5611 const bool bound = schema.has(Schema::Identifier(arg.table_name.text,
5612 arg.attr_name.text.assert_not_none()));
5613
5614 auto r = entry.extract<_Doublex1>(info.entry.id);
5615
5616 if (build_phase) {
5617 BLOCK_OPEN(init_aggs) {
5618 if (bound) {
5619 auto _arg = env.compile(arg);
5620 auto [val_, is_null] = convert<_Doublex1>(_arg).split();
5621 Doublex1 val(val_); // due to structured binding and lambda closure
5622 IF (is_null) {
5623 r.clone().set_value(Doublex1(0.0)); // initialize with neutral element 0
5624 if (info.entry.nullable())
5625 r.clone().set_null_bit(Boolx1(true)); // first value is NULL
5626 } ELSE {
5627 r.clone().set_value(val); // initialize with first value
5628 if (info.entry.nullable())
5629 r.clone().set_null_bit(Boolx1(false)); // first value is not NULL
5630 };
5631 } else {
5632 r.clone().set_value(Doublex1(0.0)); // initialize with neutral element 0
5633 if (info.entry.nullable())
5634 r.clone().set_null_bit(Boolx1(true)); // initialize with neutral element NULL
5635 }
5636 }
5637 }
5638 if (not bound) {
5639 r.discard();
5640 break; // AVG does not change in a phase where the argument is unbound
5641 }
5642 BLOCK_OPEN(update_avg_aggs) {
5643 /* Compute AVG as iterative mean as described in Knuth, The Art of Computer Programming
5644 * Vol 2, section 4.2.2. */
5645 auto _arg = env.compile(arg);
5646 _Doublex1 _new_val = convert<_Doublex1>(_arg);
5647 if (_new_val.can_be_null()) {
5648 auto [new_val, new_val_is_null_] = _new_val.split();
5649 auto [old_avg_, old_avg_is_null] = _Doublex1(r.clone()).split();
5650 const Var<Boolx1> new_val_is_null(new_val_is_null_); // due to multiple uses
5651 const Var<Doublex1> old_avg(old_avg_); // due to multiple uses
5652
5653 auto delta_absolute = new_val - old_avg;
5654 auto running_count = _I64x1(entry.get<_I64x1>(avg_info.running_count)).insist_not_null();
5655 auto delta_relative = delta_absolute / running_count.to<double>();
5656
5657 auto chosen_r = Select(new_val_is_null, dummy->extract<_Doublex1>(info.entry.id), r.clone());
5658 chosen_r.set_value(
5659 old_avg + delta_relative // update old average with new value
5660 ); // if new value is NULL, only dummy is written
5661 r.set_null_bit(
5662 old_avg_is_null and new_val_is_null // AVG is NULL iff all values are NULL
5663 );
5664 } else {
5665 auto new_val = _new_val.insist_not_null();
5666 auto old_avg_ = _Doublex1(r.clone()).insist_not_null();
5667 const Var<Doublex1> old_avg(old_avg_); // due to multiple uses
5668
5669 auto delta_absolute = new_val - old_avg;
5670 auto running_count = _I64x1(entry.get<_I64x1>(avg_info.running_count)).insist_not_null();
5671 auto delta_relative = delta_absolute / running_count.to<double>();
5672 r.set_value(
5673 old_avg + delta_relative // update old average with new value
5674 );
5675 /* do not update NULL bit since it is already set to `false` */
5676 }
5677 }
5678 break;
5679 }
5680 case m::Function::FN_SUM: {
5681 M_insist(info.args.size() == 1, "SUM aggregate function expects exactly one argument");
5682 auto &arg = as<const Designator>(*info.args[0]);
5683 const bool bound = schema.has(Schema::Identifier(arg.table_name.text,
5684 arg.attr_name.text.assert_not_none()));
5685
5686 std::visit(overloaded {
5687 [&]<sql_type _T>(HashTable::reference_t<_T> &&r) -> void
5688 requires (not (std::same_as<_T, _Boolx1> or std::same_as<_T, NChar>)) {
5689 using type = typename _T::type;
5690 using T = PrimitiveExpr<type>;
5691
5692 if (build_phase) {
5693 BLOCK_OPEN(init_aggs) {
5694 if (bound) {
5695 auto _arg = env.compile(arg);
5696 auto [val_, is_null] = convert<_T>(_arg).split();
5697 T val(val_); // due to structured binding and lambda closure
5698 IF (is_null) {
5699 r.clone().set_value(T(type(0))); // initialize with neutral element 0
5700 if (info.entry.nullable())
5701 r.clone().set_null_bit(Boolx1(true)); // first value is NULL
5702 } ELSE {
5703 r.clone().set_value(val); // initialize with first value
5704 if (info.entry.nullable())
5705 r.clone().set_null_bit(Boolx1(false)); // first value is not NULL
5706 };
5707 } else {
5708 r.clone().set_value(T(type(0))); // initialize with neutral element 0
5709 if (info.entry.nullable())
5710 r.clone().set_null_bit(Boolx1(true)); // initialize with neutral element NULL
5711 }
5712 }
5713 }
5714 if (not bound) {
5715 r.discard();
5716 return; // SUM may later be multiplied by the group counter but does not change here
5717 }
5718 BLOCK_OPEN(update_aggs) {
5719 auto _arg = env.compile(arg);
5720 _T _new_val = convert<_T>(_arg);
5721 if (_new_val.can_be_null()) {
5722 auto [new_val, new_val_is_null_] = _new_val.split();
5723 auto [old_sum, old_sum_is_null] = _T(r.clone()).split();
5724 const Var<Boolx1> new_val_is_null(new_val_is_null_); // due to multiple uses
5725
5726 auto chosen_r = Select(new_val_is_null, dummy->extract<_T>(info.entry.id), r.clone());
5727 chosen_r.set_value(
5728 old_sum + new_val // add new value to old sum
5729 ); // if new value is NULL, only dummy is written
5730 r.set_null_bit(
5731 old_sum_is_null and new_val_is_null // SUM is NULL iff all values are NULL
5732 );
5733 } else {
5734 auto new_val = _new_val.insist_not_null();
5735 auto old_sum = _T(r.clone()).insist_not_null();
5736 r.set_value(
5737 old_sum + new_val // add new value to old sum
5738 );
5739 /* do not update NULL bit since it is already set to `false` */
5740 }
5741 }
5742 },
5743 []<sql_type _T>(HashTable::reference_t<_T>&&) -> void
5744 requires std::same_as<_T, _Boolx1> or std::same_as<_T, NChar> {
5745 M_unreachable("invalid type");
5746 },
5747 [](std::monostate) -> void { M_unreachable("invalid reference"); },
5748 }, entry.extract(info.entry.id));
5749 break;
5750 }
5751 case m::Function::FN_COUNT: {
5752 M_insist(info.args.size() <= 1, "COUNT aggregate function expects at most one argument");
5753
5754 auto r = entry.get<_I64x1>(info.entry.id); // do not extract to be able to access for AVG case
5755
5756 if (info.args.empty()) {
5757 if (not build_phase) {
5758 r.discard();
5759 break; // COUNT(*) will later be multiplied by the probe counter but only changes in the build phase
5760 }
5761 BLOCK_OPEN(init_aggs) {
5762 r.clone() = _I64x1(1); // initialize with 1 (for first value)
5763 }
5764 BLOCK_OPEN(update_aggs) {
5765 auto old_count = _I64x1(r.clone()).insist_not_null();
5766 r.set_value(
5767 old_count + int64_t(1) // increment old count by 1
5768 );
5769 /* do not update NULL bit since it is already set to `false` */
5770 }
5771 } else {
5772 auto &arg = as<const Designator>(*info.args[0]);
5773 const bool bound = schema.has(Schema::Identifier(arg.table_name.text,
5774 arg.attr_name.text.assert_not_none()));
5775
5776 if (build_phase) {
5777 BLOCK_OPEN(init_aggs) {
5778 if (bound) {
5779 auto _arg = env.compile(arg);
5780 I64x1 new_val_not_null =
5781 can_be_null(_arg) ? not_null(_arg).to<int64_t>()
5782 : (discard(_arg), I64x1(1)); // discard since no use
5783 r.clone() = _I64x1(new_val_not_null); // initialize with 1 iff first value is present
5784 } else {
5785 r.clone() = _I64x1(0); // initialize with neutral element 0
5786 }
5787 }
5788 }
5789 if (not bound) {
5790 r.discard();
5791 break; // COUNT may later be multiplied by the group counter but does not change here
5792 }
5793 BLOCK_OPEN(update_aggs) {
5794 auto _arg = env.compile(arg);
5795 I64x1 new_val_not_null =
5796 can_be_null(_arg) ? not_null(_arg).to<int64_t>()
5797 : (discard(_arg), I64x1(1)); // discard since no use
5798 auto old_count = _I64x1(r.clone()).insist_not_null();
5799 r.set_value(
5800 old_count + new_val_not_null // increment old count by 1 iff new value is present
5801 );
5802 /* do not update NULL bit since it is already set to `false` */
5803 }
5804 }
5805 break;
5806 }
5807 }
5808 }
5809 return { std::move(init_aggs), std::move(update_aggs), std::move(update_avg_aggs) };
5810 };
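 /* Worked example of the counter rescaling (a sketch, not part of the original source):
  * assume a group with 3 matching build tuples and 2 matching probe tuples. COUNT(*) is
  * accumulated only during the build phase and yields 3; the final pass multiplies it by
  * $probe_counter = 2, giving the correct per-group join count of 6. COUNT and SUM over an
  * argument bound in one child are rescaled analogously by the other phase's counter, and
  * AVG needs no rescaling since the common factor cancels in sum/count. */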
5811
5812 /*----- Create function for build child. -----*/
5813 FUNCTION(hash_based_group_join_build_child_pipeline, void(void)) // create function for pipeline
5814 {
5815 auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function
5816
5817 M.children[0]->execute(
5818 /* setup= */ setup_t::Make_Without_Parent([&](){
5819 ht->setup();
5820 ht->set_high_watermark(M.load_factor);
5821 dummy.emplace(ht->dummy_entry()); // create dummy slot to ignore NULL values in aggregate computations
5822 }),
5823 /* pipeline= */ [&](){
5824 M_insist(bool(dummy));
5825 const auto &env = CodeGenContext::Get().env();
5826
5827 std::optional<Boolx1> build_key_not_null;
5828 for (auto &build_key : build_keys) {
5829 auto val = env.get(build_key);
5830 if (build_key_not_null)
5831 build_key_not_null.emplace(*build_key_not_null and not_null(val));
5832 else
5833 build_key_not_null.emplace(not_null(val));
5834 }
5835 M_insist(bool(build_key_not_null));
5836 IF (*build_key_not_null) { // TODO: predicated version
5837 /*----- Insert key if not yet done. -----*/
5838 std::vector<SQL_t> key;
5839 for (auto &build_key : build_keys)
5840 key.emplace_back(env.get(build_key));
5841 auto [entry, inserted] = ht->try_emplace(std::move(key));
5842
5843 /*----- Compile aggregates. -----*/
5844 auto t = compile_aggregates(entry, env, M.build.schema(), /* build_phase= */ true);
5845 auto &init_aggs = std::get<0>(t);
5846 auto &update_aggs = std::get<1>(t);
5847 auto &update_avg_aggs = std::get<2>(t);
5848
5849 /*----- Add group counters to compiled aggregates. -----*/
5850 if (needs_build_counter) {
5851 auto r = entry.extract<_I64x1>(C.pool("$build_counter"));
5852 BLOCK_OPEN(init_aggs) {
5853 r.clone() = _I64x1(1); // initialize with 1 (for first value)
5854 }
5855 BLOCK_OPEN(update_aggs) {
5856 auto old_count = _I64x1(r.clone()).insist_not_null();
5857 r.set_value(
5858 old_count + int64_t(1) // increment old count by 1
5859 );
5860 /* do not update NULL bit since it is already set to `false` */
5861 }
5862 }
5863 BLOCK_OPEN(init_aggs) {
5864 auto r = entry.extract<_I64x1>(C.pool("$probe_counter"));
5865 r = _I64x1(0); // initialize with neutral element 0
5866 }
5867
5868 /*----- If group has been inserted, initialize aggregates. Otherwise, update them. -----*/
5869 IF (inserted) {
5870 init_aggs.attach_to_current();
5871 } ELSE {
5872 update_aggs.attach_to_current();
5873 update_avg_aggs.attach_to_current(); // attached after the other updates so the running count is already incremented
5874 };
5875 };
5876 },
5877 /* teardown= */ teardown_t::Make_Without_Parent([&](){ ht->teardown(); })
5878 );
5879 }
5880 hash_based_group_join_build_child_pipeline(); // call build child function
5881
5882 /*----- Create function for probe child. -----*/
5883 FUNCTION(hash_based_group_join_probe_child_pipeline, void(void)) // create function for pipeline
5884 {
5885 auto S = CodeGenContext::Get().scoped_environment(); // create scoped environment for this function
5886
5887 M.children[1]->execute(
5888 /* setup= */ setup_t::Make_Without_Parent([&](){
5889 ht->setup();
5890 dummy.emplace(ht->dummy_entry()); // create dummy slot to ignore NULL values in aggregate computations
5891 }),
5892 /* pipeline= */ [&](){
5893 M_insist(bool(dummy));
5894 const auto &env = CodeGenContext::Get().env();
5895
5896 /* TODO: may check for NULL on probe keys as well, branching + predicated version */
5897 /*----- Probe with probe key. -----*/
5898 std::vector<SQL_t> key;
5899 for (auto &probe_key : probe_keys)
5900 key.emplace_back(env.get(probe_key));
5901 auto [entry, found] = ht->find(std::move(key));
5902
5903 /*----- Compile aggregates. -----*/
5904 auto t = compile_aggregates(entry, env, M.probe.schema(), /* build_phase= */ false);
5905 auto &init_aggs = std::get<0>(t);
5906 auto &update_aggs = std::get<1>(t);
5907 auto &update_avg_aggs = std::get<2>(t);
5908
5909 /*----- Add probe counter to compiled aggregates. -----*/
5910 BLOCK_OPEN(update_aggs) {
5911 auto r = entry.extract<_I64x1>(C.pool("$probe_counter"));
5912 auto old_count = _I64x1(r.clone()).insist_not_null();
5913 r.set_value(
5914 old_count + int64_t(1) // increment old count by 1
5915 );
5916 /* do not update NULL bit since it is already set to `false` */
5917 }
5918
5919 /*----- If group has been inserted, initialize aggregates. Otherwise, update them. -----*/
5920 M_insist(init_aggs.empty(), "aggregates must be initialized in build phase");
5921 IF (found) {
5922 update_aggs.attach_to_current();
5923 update_avg_aggs.attach_to_current(); // attached after the other updates so the running count is already incremented
5924 };
5925 },
5926 /* teardown= */ teardown_t::Make_Without_Parent([&](){ ht->teardown(); })
5927 );
5928 }
5929 hash_based_group_join_probe_child_pipeline(); // call probe child function
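/* At this point both pipelines have run: every hash table entry holds the per-group partial
 * aggregates together with the `$build_counter` and `$probe_counter` bookkeeping slots that
 * the final pass below consumes for rescaling and for filtering out groups without probe
 * matches. */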
5930
5931 auto &env = CodeGenContext::Get().env();
5932
5933 /*----- Process each computed group. -----*/
5934 setup_t(std::move(setup), [&](){ ht->setup(); })();
5935 ht->for_each([&, pipeline=std::move(pipeline)](HashTable::const_entry_t entry){
5936 /*----- Check whether probe match was found. -----*/
5937 I64x1 probe_counter = _I64x1(entry.get<_I64x1>(C.pool("$probe_counter"))).insist_not_null();
5938 IF (probe_counter != int64_t(0)) {
5939 /*----- Compute key schema to detect duplicated keys. -----*/
5940 Schema key_schema;
5941 for (std::size_t i = 0; i < num_keys; ++i) {
5942 auto &e = M.grouping.schema()[i];
5943 key_schema.add(e.id, e.type, e.constraints);
5944 }
5945
5946 /*----- Add computed group tuples to current environment. ----*/
5947 for (auto &e : M.grouping.schema().deduplicate()) {
5948 try {
5949 key_schema.find(e.id);
5950 } catch (invalid_argument&) {
5951 continue; // skip duplicated keys since they must not be used afterwards
5952 }
5953
5954 if (auto it = avg_aggregates.find(e.id);
5955 it != avg_aggregates.end() and not it->second.compute_running_avg)
5956 { // AVG aggregate that is not yet computed: divide the computed sum by the computed count
5957 auto &avg_info = it->second;
5958 auto sum = std::visit(overloaded {
5959 [&]<sql_type T>(HashTable::const_reference_t<T> &&r) -> _Doublex1
5960 requires (std::same_as<T, _I64x1> or std::same_as<T, _Doublex1>) {
5961 return T(r).template to<double>();
5962 },
5963 [](auto&&) -> _Doublex1 { M_unreachable("invalid type"); },
5964 [](std::monostate&&) -> _Doublex1 { M_unreachable("invalid reference"); },
5965 }, entry.get(avg_info.sum));
5966 auto count = _I64x1(entry.get<_I64x1>(avg_info.running_count)).insist_not_null().to<double>();
5967 auto avg = sum / count; // no need to multiply by the group counter, as the factor cancels in the fraction
5968 if (avg.can_be_null()) {
5969 _Var<Doublex1> var(avg); // introduce variable s.t. uses only load from it
5970 env.add(e.id, var);
5971 } else {
5972 /* introduce variable w/o NULL bit s.t. uses only load from it */
5973 Var<Doublex1> var(avg.insist_not_null());
5974 env.add(e.id, _Doublex1(var));
5975 }
5976 } else { // part of key or already computed aggregate (without multiplication with group counter)
5977 std::visit(overloaded {
5978 [&]<typename T>(HashTable::const_reference_t<Expr<T>> &&r) -> void {
5979 Expr<T> value = r;
5980
5981 auto pred = [&e](const auto &info) -> bool { return info.entry.id == e.id; };
5982 if (auto it = std::find_if(aggregates.cbegin(), aggregates.cend(), pred);
5983 it != aggregates.cend())
5984 { // aggregate
5985 /* For COUNT and SUM, multiply the current aggregate value by the respective group counter,
5986 * since only tuples of the phase in which the argument is bound are counted/summed up. */
5987 if (it->args.empty()) {
5988 M_insist(it->fnid == m::Function::FN_COUNT,
5989 "only COUNT aggregate function may have no argument");
5990 I64x1 probe_counter =
5991 _I64x1(entry.get<_I64x1>(C.pool("$probe_counter"))).insist_not_null();
5992 PrimitiveExpr<T> count = value.insist_not_null() * probe_counter.to<T>();
5993 Var<PrimitiveExpr<T>> var(count); // introduce variable s.t. uses only load from it
5994 env.add(e.id, Expr<T>(var));
5995 return; // next group tuple entry
5996 } else {
5997 M_insist(it->args.size() == 1, "aggregate functions expect at most one argument");
5998 auto &des = as<const Designator>(*it->args[0]);
5999 Schema::Identifier arg(des.table_name.text, des.attr_name.text.assert_not_none());
6000 if (it->fnid == m::Function::FN_COUNT or it->fnid == m::Function::FN_SUM) {
6001 if (M.probe.schema().has(arg)) {
6002 I64x1 build_counter =
6003 _I64x1(entry.get<_I64x1>(C.pool("$build_counter"))).insist_not_null();
6004 auto agg = value * build_counter.to<T>();
6005 if (agg.can_be_null()) {
6006 Var<Expr<T>> var(agg); // introduce variable s.t. uses only load from it
6007 env.add(e.id, var);
6008 } else {
6009 /* introduce variable w/o NULL bit s.t. uses only load from it */
6010 Var<PrimitiveExpr<T>> var(agg.insist_not_null());
6011 env.add(e.id, Expr<T>(var));
6012 }
6013 } else {
6014 M_insist(M.build.schema().has(arg),
6015 "argument ID must occur in either child schema");
6016 I64x1 probe_counter =
6017 _I64x1(entry.get<_I64x1>(C.pool("$probe_counter"))).insist_not_null();
6018 auto agg = value * probe_counter.to<T>();
6019 if (agg.can_be_null()) {
6020 Var<Expr<T>> var(agg); // introduce variable s.t. uses only load from it
6021 env.add(e.id, var);
6022 } else {
6023 /* introduce variable w/o NULL bit s.t. uses only load from it */
6024 Var<PrimitiveExpr<T>> var(agg.insist_not_null());
6025 env.add(e.id, Expr<T>(var));
6026 }
6027 }
6028 return; // next group tuple entry
6029 }
6030 }
6031 }
6032
6033 /* fallthrough: part of key or correctly computed aggregate */
6034 if (value.can_be_null()) {
6035 Var<Expr<T>> var(value); // introduce variable s.t. uses only load from it
6036 env.add(e.id, var);
6037 } else {
6038 /* introduce variable w/o NULL bit s.t. uses only load from it */
6039 Var<PrimitiveExpr<T>> var(value.insist_not_null());
6040 env.add(e.id, Expr<T>(var));
6041 }
6042 },
6043 [&](HashTable::const_reference_t<_Boolx1> &&r) -> void {
6044#ifndef NDEBUG
6045 auto pred = [&e](const auto &info) -> bool { return info.entry.id == e.id; };
6046 M_insist(std::find_if(aggregates.cbegin(), aggregates.cend(), pred) == aggregates.cend(),
6047 "booleans must not be the result of aggregate functions");
6048#endif
6049 _Boolx1 value = r;
6050 if (value.can_be_null()) {
6051 _Var<Boolx1> var(value); // introduce variable s.t. uses only load from it
6052 env.add(e.id, var);
6053 } else {
6054 /* introduce variable w/o NULL bit s.t. uses only load from it */
6055 Var<Boolx1> var(value.insist_not_null());
6056 env.add(e.id, _Boolx1(var));
6057 }
6058 },
6059 [&](HashTable::const_reference_t<NChar> &&r) -> void {
6060#ifndef NDEBUG
6061 auto pred = [&e](const auto &info) -> bool { return info.entry.id == e.id; };
6062 M_insist(std::find_if(aggregates.cbegin(), aggregates.cend(), pred) == aggregates.cend(),
6063 "strings must not be the result of aggregate functions");
6064#endif
6065 NChar value(r);
6066 Var<Ptr<Charx1>> var(value.val()); // introduce variable s.t. uses only load from it
6067 env.add(e.id, NChar(var, value.can_be_null(), value.length(),
6068 value.guarantees_terminating_nul()));
6069 },
6070 [](std::monostate&&) -> void { M_unreachable("invalid reference"); },
6071 }, entry.get(e.id)); // do not extract, so not-yet-computed AVG aggregates can still access this slot
6072 }
6073 }
6074
6075 /*----- Resume pipeline. -----*/
6076 pipeline();
6077 };
6078 });
6079 teardown_t(std::move(teardown), [&](){ ht->teardown(); })();
6080}
6081
6082
6083/*======================================================================================================================
6084 * Match<T>::print()
6085 *====================================================================================================================*/
6086
6087struct print_info
6088{
6089 const Operator &op;
6090
6091 friend std::ostream & operator<<(std::ostream &out, const print_info &info) {
6092 if (info.op.has_info())
6093 out << " <" << info.op.info().estimated_cardinality << '>';
6094 return out;
6095 }
6096};
6097
6098void Match<m::wasm::NoOp>::print(std::ostream &out, unsigned level) const
6099{
6100 indent(out, level) << "wasm::NoOp" << print_info(this->noop) << " (cumulative cost " << cost() << ')';
6101 this->child->print(out, level + 1);
6102}
6103
6104template<bool SIMDfied>
6105void Match<m::wasm::Callback<SIMDfied>>::print(std::ostream &out, unsigned level) const
6106{
6107 indent(out, level) << "wasm::Callback with " << this->result_set_window_size << " tuples result set "
6108 << this->callback.schema() << print_info(this->callback)
6109 << " (cumulative cost " << cost() << ')';
6110 this->child->print(out, level + 1);
6111}
6112
6113template<bool SIMDfied>
6114void Match<m::wasm::Print<SIMDfied>>::print(std::ostream &out, unsigned level) const
6115{
6116 indent(out, level) << "wasm::Print with " << this->result_set_window_size << " tuples result set "
6117 << this->print_op.schema() << print_info(this->print_op)
6118 << " (cumulative cost " << cost() << ')';
6119 this->child->print(out, level + 1);
6120}
6121
6122template<bool SIMDfied>
6123void Match<m::wasm::Scan<SIMDfied>>::print(std::ostream &out, unsigned level) const
6124{
6125 indent(out, level) << (SIMDfied ? "wasm::SIMDScan(" : "wasm::Scan(") << this->scan.alias() << ") ";
6126 if (this->buffer_factory_ and this->scan.schema().drop_constants().deduplicate().num_entries())
6127 out << "with " << this->buffer_num_tuples_ << " tuples output buffer ";
6128 out << this->scan.schema() << print_info(this->scan) << " (cumulative cost " << cost() << ')';
6129}
6130
6131template<idx::IndexMethod IndexMethod>
6132void Match<m::wasm::IndexScan<IndexMethod>>::print(std::ostream &out, unsigned level) const
6133{
6134 if (IndexMethod == idx::IndexMethod::Array)
6135 indent(out, level) << "wasm::ArrayIndexScan(";
6136 else if (IndexMethod == idx::IndexMethod::Rmi)
6137 indent(out, level) << "wasm::RecursiveModelIndexScan(";
6138 else
6139 M_unreachable("unknown index");
6140
6141 if (options::index_scan_strategy == option_configs::IndexScanStrategy::COMPILATION) {
6142 out << "Compilation[";
6143 if (options::index_scan_compilation_strategy == option_configs::IndexScanCompilationStrategy::CALLBACK)
6144 out << "Callback";
6145 else if (options::index_scan_compilation_strategy == option_configs::IndexScanCompilationStrategy::EXPOSED_MEMORY)
6146 out << "ExposedMemory";
6147 else
6148 M_unreachable("unknown compilation strategy");
6149 } else if (options::index_scan_strategy == option_configs::IndexScanStrategy::INTERPRETATION) {
6150 out << "Interpretation[";
6151 if (options::index_scan_materialization_strategy == option_configs::IndexScanMaterializationStrategy::INLINE)
6152 out << "Inline";
6153 else if (options::index_scan_materialization_strategy == option_configs::IndexScanMaterializationStrategy::MEMORY)
6154 out << "Memory";
6155 else
6156 M_unreachable("unknown materialization strategy");
6157 } else if (options::index_scan_strategy == option_configs::IndexScanStrategy::HYBRID) {
6158 out << "Hybrid[";
6159 if (options::index_scan_materialization_strategy == option_configs::IndexScanMaterializationStrategy::INLINE)
6160 out << "Inline,";
6161 else if (options::index_scan_materialization_strategy == option_configs::IndexScanMaterializationStrategy::MEMORY)
6162 out << "Memory,";
6163 else
6164 M_unreachable("unknown materialization strategy");
6165 if (options::index_scan_compilation_strategy == option_configs::IndexScanCompilationStrategy::CALLBACK)
6166 out << "Callback";
6167 else if (options::index_scan_compilation_strategy == option_configs::IndexScanCompilationStrategy::EXPOSED_MEMORY)
6168 out << "ExposedMemory";
6169 else
6170 M_unreachable("unknown compilation strategy");
6171 } else {
6172 M_unreachable("unknown strategy");
6173 }
6174
6175 out << "], " << this->scan.alias() << ", " << this->filter.filter() << ") ";
6176 if (this->buffer_factory_ and this->scan.schema().drop_constants().deduplicate().num_entries())
6177 out << "with " << this->buffer_num_tuples_ << " tuples output buffer ";
6178 out << this->scan.schema() << print_info(this->scan) << " (cumulative cost " << cost() << ')';
6179}
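/* Illustrative only (not output captured from a real run): with the hybrid strategy and
 * inline materialization, this would print along the lines of
 * `wasm::ArrayIndexScan(Hybrid[Inline,Callback], lineitem, (l_orderkey < 100)) ...`. */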
6180
6181template<bool Predicated>
6182void Match<m::wasm::Filter<Predicated>>::print(std::ostream &out, unsigned level) const
6183{
6184 indent(out, level) << "wasm::" << (Predicated ? "Predicated" : "Branching") << "Filter ";
6185 if (this->buffer_factory_ and this->filter.schema().drop_constants().deduplicate().num_entries())
6186 out << "with " << this->buffer_num_tuples_ << " tuples output buffer ";
6187 out << this->filter.schema() << print_info(this->filter) << " (cumulative cost " << cost() << ')';
6188 this->child->print(out, level + 1);
6189}
6190
6191void Match<m::wasm::LazyDisjunctiveFilter>::print(std::ostream &out, unsigned level) const
6192{
6193 indent(out, level) << "wasm::LazyDisjunctiveFilter ";
6194 if (this->buffer_factory_ and this->filter.schema().drop_constants().deduplicate().num_entries())
6195 out << "with " << this->buffer_num_tuples_ << " tuples output buffer ";
6196 const cnf::Clause &clause = this->filter.filter()[0];
6197 for (auto it = clause.cbegin(); it != clause.cend(); ++it) {
6198 if (it != clause.cbegin()) out << " → ";
6199 out << *it;
6200 }
6201 out << ' ' << this->filter.schema() << print_info(this->filter) << " (cumulative cost " << cost() << ')';
6202 this->child->print(out, level + 1);
6203}
6204
6205void Match<m::wasm::Projection>::print(std::ostream &out, unsigned level) const
6206{
6207 indent(out, level) << "wasm::Projection ";
6208 if (this->buffer_factory_ and this->projection.schema().drop_constants().deduplicate().num_entries())
6209 out << "with " << this->buffer_num_tuples_ << " tuples output buffer ";
6210 out << this->projection.schema() << print_info(this->projection) << " (cumulative cost " << cost() << ')';
6211 if (this->child)
6212 this->child->get()->print(out, level + 1);
6213}
6214
6215void Match<m::wasm::HashBasedGrouping>::print(std::ostream &out, unsigned level) const
6216{
6217 indent(out, level) << "wasm::HashBasedGrouping " << this->grouping.schema() << print_info(this->grouping)
6218 << " (cumulative cost " << cost() << ')';
6219 this->child->print(out, level + 1);
6220}
6221
6222void Match<m::wasm::OrderedGrouping>::print(std::ostream &out, unsigned level) const
6223{
6224 indent(out, level) << "wasm::OrderedGrouping " << this->grouping.schema() << print_info(this->grouping)
6225 << " (cumulative cost " << cost() << ')';
6226 this->child->print(out, level + 1);
6227}
6228
6229void Match<m::wasm::Aggregation>::print(std::ostream &out, unsigned level) const
6230{
6231 indent(out, level) << "wasm::Aggregation " << this->aggregation.schema() << print_info(this->aggregation)
6232 << " (cumulative cost " << cost() << ')';
6233 this->child->print(out, level + 1);
6234}
6235
6236template<bool CmpPredicated>
6237void Match<m::wasm::Quicksort<CmpPredicated>>::print(std::ostream &out, unsigned level) const
6238{
6239 indent(out, level) << "wasm::" << (CmpPredicated ? "Predicated" : "") << "Quicksort " << this->sorting.schema()
6240 << print_info(this->sorting) << " (cumulative cost " << cost() << ')';
6241 this->child->print(out, level + 1);
6242}
6243
6244void Match<m::wasm::NoOpSorting>::print(std::ostream &out, unsigned level) const
6245{
6246 indent(out, level) << "wasm::NoOpSorting" << print_info(this->sorting) << " (cumulative cost " << cost() << ')';
6247 this->child->print(out, level + 1);
6248}
6249
6250template<bool Predicated>
6251void Match<m::wasm::NestedLoopsJoin<Predicated>>::print(std::ostream &out, unsigned level) const
6252{
6253 indent(out, level) << "wasm::" << (Predicated ? "Predicated" : "") << "NestedLoopsJoin ";
6254 if (this->buffer_factory_ and this->join.schema().drop_constants().deduplicate().num_entries())
6255 out << "with " << this->buffer_num_tuples_ << " tuples output buffer ";
6256 out << this->join.schema() << print_info(this->join) << " (cumulative cost " << cost() << ')';
6257
6258 ++level;
6259 std::size_t i = this->children.size();
6260 while (i--) {
6261 const m::wasm::MatchBase &child = *this->children[i];
6262 indent(out, level) << i << ". input";
6263 child.print(out, level + 1);
6264 }
6265}
6266
6267template<bool Unique, bool Predicated>
6268void Match<m::wasm::SimpleHashJoin<Unique, Predicated>>::print(std::ostream &out, unsigned level) const
6269{
6270 indent(out, level) << "wasm::" << (Predicated ? "Predicated" : "") << "SimpleHashJoin";
6271 if (Unique) out << " on UNIQUE key ";
6272 if (this->buffer_factory_ and this->join.schema().drop_constants().deduplicate().num_entries())
6273 out << "with " << this->buffer_num_tuples_ << " tuples output buffer ";
6274 out << this->join.schema() << print_info(this->join) << " (cumulative cost " << cost() << ')';
6275
6276 ++level;
6277 const m::wasm::MatchBase &build = *this->children[0];
6278 const m::wasm::MatchBase &probe = *this->children[1];
6279 indent(out, level) << "probe input";
6280 probe.print(out, level + 1);
6281 indent(out, level) << "build input";
6282 build.print(out, level + 1);
6283}
6284
6285template<bool SortLeft, bool SortRight, bool Predicated, bool CmpPredicated>
6286void Match<m::wasm::SortMergeJoin<SortLeft, SortRight, Predicated, CmpPredicated>>::print(std::ostream &out,
6287 unsigned level) const
6288{
6289 indent(out, level) << "wasm::" << (Predicated ? "Predicated" : "") << "SortMergeJoin ";
6290 switch ((unsigned(SortLeft) << 1) | unsigned(SortRight))
6291 {
6292 case 0: out << "pre-sorted "; break;
6293 case 1: out << "sorting right input " << (CmpPredicated ? "predicated " : ""); break;
6294 case 2: out << "sorting left input " << (CmpPredicated ? "predicated " : ""); break;
6295 case 3: out << "sorting both inputs " << (CmpPredicated ? "predicated " : ""); break;
6296 }
6297 const bool needs_buffer_parent = not is<const ScanOperator>(this->parent) or SortLeft;
6298 const bool needs_buffer_child = not is<const ScanOperator>(this->child) or SortRight;
6299 if (needs_buffer_parent and needs_buffer_child)
6300 out << "and materializing both inputs ";
6301 else if (needs_buffer_parent)
6302 out << "and materializing left input ";
6303 else if (needs_buffer_child)
6304 out << "and materializing right input ";
6305 out << this->join.schema() << print_info(this->join) << " (cumulative cost " << cost() << ')';
6306
6307 ++level;
6308 const m::wasm::MatchBase &left = *this->children[0];
6309 const m::wasm::MatchBase &right = *this->children[1];
6310 indent(out, level) << "right input";
6311 right.print(out, level + 1);
6312 indent(out, level) << "left input";
6313 left.print(out, level + 1);
6314}
6315
6316void Match<m::wasm::Limit>::print(std::ostream &out, unsigned level) const
6317{
6318 indent(out, level) << "wasm::Limit " << this->limit.schema() << print_info(this->limit)
6319 << " (cumulative cost " << cost() << ')';
6320 this->child->print(out, level + 1);
6321}
6322
6323void Match<m::wasm::HashBasedGroupJoin>::print(std::ostream &out, unsigned level) const
6324{
6325 indent(out, level) << "wasm::HashBasedGroupJoin ";
6326 if (this->buffer_factory_ and this->grouping.schema().drop_constants().deduplicate().num_entries())
6327 out << "with " << this->buffer_num_tuples_ << " tuples output buffer ";
6328 out << this->grouping.schema() << print_info(this->grouping) << " (cumulative cost " << cost() << ')';
6329
6330 ++level;
6331 const m::wasm::MatchBase &build = *this->children[0];
6332 const m::wasm::MatchBase &probe = *this->children[1];
6333 indent(out, level) << "probe input";
6334 probe.print(out, level + 1);
6335 indent(out, level) << "build input";
6336 build.print(out, level + 1);
6337}
6338
6339
6340/*======================================================================================================================
6341 * ThePreOrderMatchBaseVisitor, ThePostOrderMatchBaseVisitor
6342 *====================================================================================================================*/
6343
6344namespace {
6345
6346template<bool C, bool PreOrder>
6347struct recursive_matchbase_visitor : TheRecursiveMatchBaseVisitorBase<C>
6348{
6349 using super = TheRecursiveMatchBaseVisitorBase<C>;
6350 template<typename T> using Const = typename super::template Const<T>;
6351 using callback_t = std::conditional_t<C, ConstMatchBaseVisitor, MatchBaseVisitor>;
6352
6353 private:
6354 callback_t &callback_;
6355
6356 public:
6357 recursive_matchbase_visitor(callback_t &callback) : callback_(callback) { }
6358
6359 using super::operator();
6360#define DECLARE(CLASS) \
6361 void operator()(Const<CLASS> &M) override { \
6362 if constexpr (PreOrder) try { callback_(M); } catch (visit_skip_subtree) { return; } \
6363 super::operator()(M); \
6364 if constexpr (not PreOrder) callback_(M); \
6365 }
6366 M_WASM_MATCH_LIST(DECLARE)
6367#undef DECLARE
6368};
6369
6370}
6371
6372template<bool C>
6373void ThePreOrderMatchBaseVisitor<C>::operator()(Const<MatchBase> &M)
6374{
6375 recursive_matchbase_visitor<C, /* PreOrder= */ true>{*this}(M);
6376}
6377
6378template<bool C>
6379void ThePostOrderMatchBaseVisitor<C>::operator()(Const<MatchBase> &M)
6380{
6381 recursive_matchbase_visitor<C, /* PreOrder= */ false>{*this}(M);
6382}
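/* Semantics of the two orders (summarizing the DECLARE expansion above): a pre-order
 * visitor invokes the callback before descending and may throw visit_skip_subtree to
 * prune recursion into a match's children; a post-order visitor invokes the callback
 * only after all children have been visited. */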
6383
6384
6385/*======================================================================================================================
6386 * Explicit template instantiations
6387 *====================================================================================================================*/
6388
6389#define INSTANTIATE(CLASS) \
6390 template struct m::wasm::CLASS; \
6391 template struct m::Match<m::wasm::CLASS>;
6392M_WASM_OPERATOR_LIST_TEMPLATED(INSTANTIATE)
6393#undef INSTANTIATE
6394