3
0
Fork 0
mirror of https://github.com/Z3Prover/z3 synced 2025-04-06 17:44:08 +00:00

fill in missing pieces of proof hint checker for Farkas and RUP

The proof validator based on SMT format proof logs uses RUP to check propositional inferences and has plugins for theory axioms/lemmas.
This commit is contained in:
Nikolaj Bjorner 2022-08-31 05:29:15 -07:00
parent d2b618df23
commit 4abff18e8d
6 changed files with 99 additions and 33 deletions

View file

@ -15,28 +15,51 @@ Author:
Notes: Notes:
- add theory hint bypass using proof checker plugins of SMT Proof checker for clauses created during search.
- arith_proof_checker.h is currently 1. Clauses annotated by RUP (reverse unit propagation)
- could use m_drat for drup premises. are checked to be inferrable using reverse unit propagation
based on previous clauses.
2. Clauses annotated by supported proof rules (proof hints)
are checked by custom proof checkers. There is a proof checker
for each proof rule. Main proof checkers just have a single step
but the framework allows to compose proof rules, each inference
is checked for correctness by a plugin.
3. When there are no supported plugin to justify the derived
clause, or a custom check fails, the fallback is to check that the
derived clause is a consequence of the input clauses using SMT.
The last approach is a bail-out and offers a weaker notion of
self-validation. It is often (but not always) sufficient for using proof
checking for debugging, as the root-cause for an unsound inference in z3
does not necessarily manifest when checking the conclusion of the
inference. An external proof checker that uses such fallbacks could
use several solvers, or bootstrap from a solver that can generate certificates
when z3 does not.
--*/ --*/
#include "util/small_object_allocator.h" #include "util/small_object_allocator.h"
#include "ast/ast_util.h" #include "ast/ast_util.h"
#include "cmd_context/cmd_context.h"
#include "smt/smt_solver.h" #include "smt/smt_solver.h"
#include "sat/sat_solver.h" #include "sat/sat_solver.h"
#include "sat/sat_drat.h" #include "sat/sat_drat.h"
#include "sat/smt/euf_proof_checker.h" #include "sat/smt/euf_proof_checker.h"
#include "cmd_context/cmd_context.h"
#include <iostream> #include <iostream>
class smt_checker { class smt_checker {
ast_manager& m; ast_manager& m;
params_ref m_params; params_ref m_params;
// for checking proof rules (hints)
euf::proof_checker m_checker; euf::proof_checker m_checker;
// for fallback SMT checker
scoped_ptr<solver> m_solver; scoped_ptr<solver> m_solver;
// for RUP
symbol m_rup; symbol m_rup;
sat::solver m_sat_solver; sat::solver m_sat_solver;
sat::drat m_drat; sat::drat m_drat;
@ -63,11 +86,10 @@ public:
m_rup = symbol("rup"); m_rup = symbol("rup");
} }
bool is_rup(expr* proof_hint) { bool is_rup(app* proof_hint) {
return return
proof_hint && proof_hint &&
is_app(proof_hint) && proof_hint->get_name() == m_rup;
to_app(proof_hint)->get_name() == m_rup;
} }
void mk_clause(expr_ref_vector const& clause) { void mk_clause(expr_ref_vector const& clause) {
@ -79,6 +101,14 @@ public:
m_clause.push_back(sat::literal(e->get_id(), sign)); m_clause.push_back(sat::literal(e->get_id(), sign));
} }
} }
void mk_clause(expr* e) {
m_clause.reset();
bool sign = false;
while (m.is_not(e, e))
sign = !sign;
m_clause.push_back(sat::literal(e->get_id(), sign));
}
bool check_rup(expr_ref_vector const& clause) { bool check_rup(expr_ref_vector const& clause) {
add_units(); add_units();
@ -86,25 +116,38 @@ public:
return m_drat.is_drup(m_clause.size(), m_clause.data(), m_units); return m_drat.is_drup(m_clause.size(), m_clause.data(), m_units);
} }
bool check_rup(expr* u) {
add_units();
mk_clause(u);
return m_drat.is_drup(m_clause.size(), m_clause.data(), m_units);
}
void add_clause(expr_ref_vector const& clause) { void add_clause(expr_ref_vector const& clause) {
mk_clause(clause); mk_clause(clause);
m_drat.add(m_clause, sat::status::input()); m_drat.add(m_clause, sat::status::input());
} }
void check(expr_ref_vector const& clause, expr* proof_hint) { void check(expr_ref_vector& clause, app* proof_hint) {
if (is_rup(proof_hint) && check_rup(clause)) { if (is_rup(proof_hint) && check_rup(clause)) {
std::cout << "(verified-rup)\n"; std::cout << "(verified-rup)\n";
return; return;
} }
if (m_checker.check(clause, proof_hint)) { expr_ref_vector units(m);
if (is_app(proof_hint)) if (m_checker.check(clause, proof_hint, units)) {
std::cout << "(verified-" << to_app(proof_hint)->get_name() << ")\n"; bool units_are_rup = true;
else for (expr* u : units) {
std::cout << "(verified-checker)\n"; if (!check_rup(u)) {
return; std::cout << "unit " << mk_pp(u, m) << " is not rup\n";
units_are_rup = false;
}
}
if (units_are_rup) {
std::cout << "(verified-" << proof_hint->get_name() << ")\n";
add_clause(clause);
return;
}
} }
m_solver->push(); m_solver->push();
@ -123,7 +166,7 @@ public:
} }
m_solver->pop(1); m_solver->pop(1);
std::cout << "(verified-smt)\n"; std::cout << "(verified-smt)\n";
// assume(clause); add_clause(clause);
} }
void assume(expr_ref_vector const& clause) { void assume(expr_ref_vector const& clause) {
@ -135,14 +178,14 @@ public:
class proof_cmds_imp : public proof_cmds { class proof_cmds_imp : public proof_cmds {
ast_manager& m; ast_manager& m;
expr_ref_vector m_lits; expr_ref_vector m_lits;
expr_ref m_proof_hint; app_ref m_proof_hint;
smt_checker m_checker; smt_checker m_checker;
public: public:
proof_cmds_imp(ast_manager& m): m(m), m_lits(m), m_proof_hint(m), m_checker(m) {} proof_cmds_imp(ast_manager& m): m(m), m_lits(m), m_proof_hint(m), m_checker(m) {}
void add_literal(expr* e) override { void add_literal(expr* e) override {
if (m.is_proof(e)) if (m.is_proof(e))
m_proof_hint = e; m_proof_hint = to_app(e);
else else
m_lits.push_back(e); m_lits.push_back(e);
} }

View file

@ -416,6 +416,8 @@ namespace sat {
void drat::verify(unsigned n, literal const* c) { void drat::verify(unsigned n, literal const* c) {
if (!m_check_unsat) if (!m_check_unsat)
return; return;
if (m_inconsistent)
return;
for (unsigned i = 0; i < n; ++i) for (unsigned i = 0; i < n; ++i)
declare(c[i]); declare(c[i]);
if (is_drup(n, c)) { if (is_drup(n, c)) {
@ -690,7 +692,7 @@ namespace sat {
++m_stats.m_num_add; ++m_stats.m_num_add;
if (m_check) { if (m_check) {
switch (sz) { switch (sz) {
case 0: add(); break; case 0: if (st.is_input()) m_inconsistent = true; else add(); break;
case 1: append(lits[0], st); break; case 1: append(lits[0], st); break;
default: append(mk_clause(sz, lits, st.is_redundant()), st); break; default: append(mk_clause(sz, lits, st.is_redundant()), st); break;
} }

View file

@ -140,11 +140,13 @@ namespace arith {
SASSERT(m_todo.empty()); SASSERT(m_todo.empty());
m_todo.push_back({ mul, e }); m_todo.push_back({ mul, e });
rational coeff1; rational coeff1;
expr* e1, *e2; expr* e1, *e2, *e3;
for (unsigned i = 0; i < m_todo.size(); ++i) { for (unsigned i = 0; i < m_todo.size(); ++i) {
auto [coeff, e] = m_todo[i]; auto [coeff, e] = m_todo[i];
if (a.is_mul(e, e1, e2) && a.is_numeral(e1, coeff1)) if (a.is_mul(e, e1, e2) && a.is_numeral(e1, coeff1))
m_todo.push_back({coeff*coeff1, e2}); m_todo.push_back({coeff*coeff1, e2});
else if (a.is_mul(e, e1, e2) && a.is_uminus(e1, e3) && a.is_numeral(e3, coeff1))
m_todo.push_back({-coeff*coeff1, e2});
else if (a.is_mul(e, e1, e2) && a.is_numeral(e2, coeff1)) else if (a.is_mul(e, e1, e2) && a.is_numeral(e2, coeff1))
m_todo.push_back({coeff*coeff1, e1}); m_todo.push_back({coeff*coeff1, e1});
else if (a.is_add(e)) else if (a.is_add(e))
@ -158,6 +160,8 @@ namespace arith {
} }
else if (a.is_numeral(e, coeff1)) else if (a.is_numeral(e, coeff1))
r.m_coeff += coeff*coeff1; r.m_coeff += coeff*coeff1;
else if (a.is_uminus(e, e1) && a.is_numeral(e1, coeff1))
r.m_coeff -= coeff*coeff1;
else else
add(r, e, coeff); add(r, e, coeff);
} }
@ -361,8 +365,14 @@ namespace arith {
return out; return out;
} }
bool check(expr_ref_vector const& clause, app* jst) override { bool check(expr_ref_vector const& clause, app* jst, expr_ref_vector& units) override {
reset(); reset();
expr_mark pos, neg;
for (expr* e : clause)
if (m.is_not(e, e))
neg.mark(e, true);
else
pos.mark(e, true);
if (jst->get_name() == symbol("farkas")) { if (jst->get_name() == symbol("farkas")) {
bool even = true; bool even = true;
@ -387,13 +397,24 @@ namespace arith {
} }
else else
return false; return false;
if (sign && !pos.is_marked(arg)) {
units.push_back(m.mk_not(arg));
pos.mark(arg, false);
}
else if (!sign && !neg.is_marked(arg)) {
units.push_back(arg);
neg.mark(arg, false);
}
} }
even = !even; even = !even;
} }
if (check_farkas()) if (check_farkas()) {
return true; return true;
}
IF_VERBOSE(0, verbose_stream() << "did not check farkas\n" << mk_pp(jst, m) << "\n"); IF_VERBOSE(0, verbose_stream() << "did not check farkas\n" << mk_pp(jst, m) << "\n"; display(verbose_stream()); );
return false; return false;
} }

View file

@ -35,13 +35,14 @@ namespace euf {
m_map.insert(rule, p); m_map.insert(rule, p);
} }
bool proof_checker::check(expr_ref_vector const& clause, expr* e) { bool proof_checker::check(expr_ref_vector const& clause, expr* e, expr_ref_vector& units) {
if (!e || !is_app(e)) if (!e || !is_app(e))
return false; return false;
units.reset();
app* a = to_app(e); app* a = to_app(e);
proof_checker_plugin* p = nullptr; proof_checker_plugin* p = nullptr;
if (m_map.find(a->get_decl()->get_name(), p)) if (m_map.find(a->get_decl()->get_name(), p))
return p->check(clause, a); return p->check(clause, a, units);
return false; return false;
} }

View file

@ -27,7 +27,7 @@ namespace euf {
class proof_checker_plugin { class proof_checker_plugin {
public: public:
virtual ~proof_checker_plugin() {} virtual ~proof_checker_plugin() {}
virtual bool check(expr_ref_vector const& clause, app* jst) = 0; virtual bool check(expr_ref_vector const& clause, app* jst, expr_ref_vector& units) = 0;
virtual void register_plugins(proof_checker& pc) = 0; virtual void register_plugins(proof_checker& pc) = 0;
}; };
@ -39,7 +39,7 @@ namespace euf {
proof_checker(ast_manager& m); proof_checker(ast_manager& m);
~proof_checker(); ~proof_checker();
void register_plugin(symbol const& rule, proof_checker_plugin*); void register_plugin(symbol const& rule, proof_checker_plugin*);
bool check(expr_ref_vector const& clause, expr* e); bool check(expr_ref_vector const& clause, expr* e, expr_ref_vector& units);
}; };
} }

View file

@ -255,9 +255,8 @@ namespace smt {
return false; return false;
ptr_vector<sort> sorts(f->get_arity(), f->get_domain()); ptr_vector<sort> sorts(f->get_arity(), f->get_domain());
svector<symbol> names; svector<symbol> names;
for (unsigned i = 0; i < f->get_arity(); ++i) { for (unsigned i = 0; i < f->get_arity(); ++i)
names.push_back(symbol(i)); names.push_back(symbol(i));
}
defined_names dn(m); defined_names dn(m);
body = replace_value_from_ctx(body); body = replace_value_from_ctx(body);
body = m.mk_lambda(sorts.size(), sorts.data(), names.data(), body); body = m.mk_lambda(sorts.size(), sorts.data(), names.data(), body);
@ -575,16 +574,16 @@ namespace smt {
for (unsigned i = 0; i < n; ++i) { for (unsigned i = 0; i < n; ++i) {
proof* pr = nullptr; proof* pr = nullptr;
expr* arg = args[i]; expr* arg = args[i];
if (m.proofs_enabled()) { if (m.proofs_enabled())
pr = m.mk_def_intro(arg); pr = m.mk_def_intro(arg);
}
m_context->internalize_assertion(arg, pr, gen); m_context->internalize_assertion(arg, pr, gen);
} }
} }
TRACE("model_checker_bug_detail", tout << "instantiating... q:\n" << mk_pp(q, m) << "\n"; TRACE("model_checker_bug_detail", tout << "instantiating... q:\n" << mk_pp(q, m) << "\n";
tout << "inconsistent: " << m_context->inconsistent() << "\n"; tout << "inconsistent: " << m_context->inconsistent() << "\n";
tout << "bindings:\n" << expr_ref_vector(m, num_decls, m_pinned_exprs.data() + offset) << "\n";); tout << "bindings:\n" << expr_ref_vector(m, num_decls, m_pinned_exprs.data() + offset) << "\n";
tout << "def " << mk_pp(inst.m_def, m) << "\n";);
m_context->add_instance(q, nullptr, num_decls, bindings.data(), inst.m_def, gen, gen, gen, dummy); m_context->add_instance(q, nullptr, num_decls, bindings.data(), inst.m_def, gen, gen, gen, dummy);
TRACE("model_checker_bug_detail", tout << "after instantiating, inconsistent: " << m_context->inconsistent() << "\n";); TRACE("model_checker_bug_detail", tout << "after instantiating, inconsistent: " << m_context->inconsistent() << "\n";);
} }