/*++ Copyright (c) 2015 Microsoft Corporation Module Name: dataflow.h Abstract: Generic bottom-up and top-down data-flow engine for analysis of rule sets. Author: Henning Guenther (t-hennig) --*/ #pragma once #include "muz/base/dl_rule.h" #include "muz/base/dl_rule_set.h" #include "util/hashtable.h" #include "util/vector.h" namespace datalog { template class fact_reader; template class fact_writer; /* The structure of fact classes: class fact { public: typedef ... ctx_t; // Empty fact static fact null_fact; fact(); -- bottom // Init (Top down) void init_down(ctx_t& ctx, const rule* r); // Init (Bottom up) bool init_up(ctx_t& ctx, const rule* r); // Step (Bottom up) bool propagate_up(ctx_t& ctx, const rule* r, const fact_reader& tail_facts); // Step (Top down) void propagate_down(ctx_t& ctx, const rule* r, fact_writer& tail_facts) const; // Debugging void dump(ctx_t& ctx, std::ostream& outp) const; // Union void join(ctx_t& ctx, const Fact& oth); // Intersection void intersect(ctx_t& ctx, const Fact& oth); }; */ template class dataflow_engine { public: typedef map, ptr_eq > fact_db; typedef hashtable, ptr_eq > todo_set; typedef typename fact_db::iterator iterator; private: const rule_set& m_rules; fact_db m_facts; todo_set m_todo[2]; unsigned m_todo_idx; typename Fact::ctx_t& m_context; rule_set::decl2rules m_body2rules; void init_bottom_up() { for (rule* cur : m_rules) { for (unsigned i = 0; i < cur->get_uninterpreted_tail_size(); ++i) { func_decl *d = cur->get_decl(i); auto& value = m_body2rules.insert_if_not_there(d, nullptr); if (!value) { value = alloc(ptr_vector); } value->push_back(cur); } if (cur->get_positive_tail_size() == 0) { func_decl *sym = cur->get_head()->get_decl(); bool new_info = m_facts.insert_if_not_there(sym, Fact()).init_up(m_context, cur); if (new_info) { m_todo[m_todo_idx].insert(sym); } } } } void init_top_down() { for (func_decl* sym : m_rules.get_output_predicates()) { TRACE("dl", tout << sym->get_name() << "\n";); const rule_vector& output_rules = m_rules.get_predicate_rules(sym); for (rule* r : output_rules) { m_facts.insert_if_not_there(sym, Fact()).init_down(m_context, r); m_todo[m_todo_idx].insert(sym); } } } void step_bottom_up() { for (func_decl* f : m_todo[m_todo_idx]) { ptr_vector * rules; if (!m_body2rules.find(f, rules)) continue; for (rule* r : *rules) { func_decl* head_sym = r->get_head()->get_decl(); fact_reader tail_facts(m_facts, r); bool new_info = m_facts.insert_if_not_there(head_sym, Fact()).propagate_up(m_context, r, tail_facts); if (new_info) { m_todo[!m_todo_idx].insert(head_sym); } } } // Update todo list m_todo[m_todo_idx].reset(); m_todo_idx = !m_todo_idx; } void step_top_down() { for (func_decl* head_sym : m_todo[m_todo_idx]) { // We can't use a reference here because we are changing the map while using the reference const Fact head_fact = m_facts.get(head_sym, Fact::null_fact); const rule_vector& deps = m_rules.get_predicate_rules(head_sym); for (rule* trg_rule : deps) { fact_writer writer(m_facts, trg_rule, m_todo[!m_todo_idx]); // Generate new facts head_fact.propagate_down(m_context, trg_rule, writer); } } // Update todo list m_todo[m_todo_idx].reset(); m_todo_idx = !m_todo_idx; } bool done() const { return m_todo[m_todo_idx].empty(); } public: dataflow_engine(typename Fact::ctx_t& ctx, const rule_set& rules) : m_rules(rules), m_todo_idx(0), m_context(ctx) {} ~dataflow_engine() { for (auto & kv : m_body2rules) dealloc(kv.m_value); } void dump(std::ostream& outp) { obj_hashtable visited; for (rule const* r : m_rules) { func_decl* head_decl = r->get_decl(); obj_hashtable::entry *dummy; if (visited.insert_if_not_there_core(head_decl, dummy)) { const Fact& fact = m_facts.get(head_decl, Fact::null_fact); outp << head_decl->get_name() << " -> "; fact.dump(m_context, outp); outp << "\n"; } for (unsigned i = 0; i < r->get_uninterpreted_tail_size(); ++i) { func_decl *tail_decl = r->get_decl(i); if (visited.insert_if_not_there_core(tail_decl, dummy)) { const Fact& fact = m_facts.get(tail_decl, Fact::null_fact); outp << tail_decl->get_name() << " -> "; fact.dump(m_context, outp); outp << "\n"; } } } } void run_bottom_up() { init_bottom_up(); while (!done()) step_bottom_up(); } void run_top_down() { init_top_down(); while (!done()) step_top_down(); } const Fact& get_fact(func_decl* decl) const { return m_facts.get(decl, Fact::null_fact); } iterator begin() const { return m_facts.begin(); } iterator end() const { return m_facts.end(); } void join(const dataflow_engine& oth) { for (auto const& kv : oth.m_facts) { typename fact_db::entry* entry; if (m_facts.insert_if_not_there_core(kv.m_key, entry)) { entry->get_data().m_value = kv.m_value; } else { entry->get_data().m_value.join(m_context, kv.m_value); } } } void intersect(const dataflow_engine& oth) { ptr_vector to_delete; for (auto const& kv : m_facts) { if (typename fact_db::entry *entry = oth.m_facts.find_core(kv.m_key)) { kv.m_value.intersect(m_context, entry->get_data().m_value); } else { to_delete.push_back(kv.m_key); } } for (func_decl* f : to_delete) { m_facts.erase(f); } } }; // This helper-class is used to look up facts for rule tails template class fact_reader { typedef typename dataflow_engine::fact_db fact_db; const fact_db& m_facts; const rule* m_rule; public: fact_reader(const fact_db& facts, const rule* r) : m_facts(facts), m_rule(r) { } const Fact& get(unsigned idx) const { return m_facts.get(m_rule->get_decl(idx), Fact::null_fact); } unsigned size() const { return m_rule->get_positive_tail_size(); } }; template class fact_writer { friend class dataflow_engine; typedef typename dataflow_engine::fact_db fact_db; fact_db& m_facts; const rule* m_rule; typename dataflow_engine::todo_set& m_todo; public: fact_writer(fact_db& facts, const rule* r, typename dataflow_engine::todo_set& todo) : m_facts(facts), m_rule(r), m_todo(todo) {} Fact& get(unsigned idx) { func_decl *sym = m_rule->get_decl(idx); return m_facts.insert_if_not_there(sym, Fact()); } void set_changed(unsigned idx) { m_todo.insert(m_rule->get_decl(idx)); } unsigned size() const { return m_rule->get_uninterpreted_tail_size(); } }; }