Files
ortools-clone/examples/cpp/sat_cnf_reader.h
2021-04-02 10:08:51 +02:00

341 lines
11 KiB
C++

// Copyright 2010-2021 Google LLC
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#ifndef OR_TOOLS_SAT_SAT_CNF_READER_H_
#define OR_TOOLS_SAT_SAT_CNF_READER_H_
#include <map>
#include <memory>
#include <string>
#include <utility>
#include <vector>
#include "absl/strings/numbers.h"
#include "absl/strings/str_split.h"
#include "absl/strings/string_view.h"
#include "absl/types/span.h"
#include "ortools/base/commandlineflags.h"
#include "ortools/base/filelineiter.h"
#include "ortools/base/integral_types.h"
#include "ortools/base/logging.h"
#include "ortools/base/macros.h"
#include "ortools/sat/boolean_problem.pb.h"
#include "ortools/sat/cp_model.pb.h"
// Controls how SatCnfReader::ProcessNewLine() reifies a soft clause that gets
// a slack variable. The slack literal is always appended to the clause; when
// this flag is true the reader additionally adds, for each original literal of
// the clause, the binary clause (not slack or not literal).
//
// NOTE(review): ABSL_FLAG defines the flag object, so this header presumably
// has to be included from a single translation unit only -- confirm before
// including it from a second .cc file.
ABSL_FLAG(bool, wcnf_use_strong_slack, true,
"If true, when we add a slack variable to reify a soft clause, we "
"enforce the fact that when it is true, the clause must be false.");
namespace operations_research {
namespace sat {
struct LinearBooleanProblemWrapper {
explicit LinearBooleanProblemWrapper(LinearBooleanProblem* p) : problem(p) {}
void SetNumVariables(int num) { problem->set_num_variables(num); }
void SetOriginalNumVariables(int num) {
problem->set_original_num_variables(num);
}
void AddConstraint(absl::Span<const int> clause) {
LinearBooleanConstraint* constraint = problem->add_constraints();
constraint->mutable_literals()->Reserve(clause.size());
constraint->mutable_coefficients()->Reserve(clause.size());
constraint->set_lower_bound(1);
for (const int literal : clause) {
constraint->add_literals(literal);
constraint->add_coefficients(1);
}
}
void AddObjectiveTerm(int literal, int64 value) {
CHECK_GE(literal, 0) << "Negative literal not supported.";
problem->mutable_objective()->add_literals(literal);
problem->mutable_objective()->add_coefficients(value);
}
void SetObjectiveOffset(int64 offset) {
problem->mutable_objective()->set_offset(offset);
}
LinearBooleanProblem* problem;
};
struct CpModelProtoWrapper {
explicit CpModelProtoWrapper(CpModelProto* p) : problem(p) {}
void SetNumVariables(int num) {
for (int i = 0; i < num; ++i) {
IntegerVariableProto* variable = problem->add_variables();
variable->add_domain(0);
variable->add_domain(1);
}
}
// TODO(user): Not supported. This is only used for displaying a wcnf
// solution in cnf format, so it is not useful internally. Instead of adding
// another field, we could use the variables names or the search heuristics
// to encode this info.
void SetOriginalNumVariables(int num) {}
int LiteralToRef(int signed_value) {
return signed_value > 0 ? signed_value - 1 : signed_value;
}
void AddConstraint(absl::Span<const int> clause) {
auto* constraint = problem->add_constraints()->mutable_bool_or();
constraint->mutable_literals()->Reserve(clause.size());
for (const int literal : clause) {
constraint->add_literals(LiteralToRef(literal));
}
}
void AddObjectiveTerm(int literal, int64 value) {
CHECK_GE(literal, 0) << "Negative literal not supported.";
problem->mutable_objective()->add_vars(LiteralToRef(literal));
problem->mutable_objective()->add_coeffs(value);
}
void SetObjectiveOffset(int64 offset) {
problem->mutable_objective()->set_offset(offset);
}
CpModelProto* problem;
};
// This class loads a file in cnf file format into a SatProblem.
// The format is described here:
// http://people.sc.fsu.edu/~jburkardt/data/cnf/cnf.html
//
// It also support the wcnf input format for partial weighted max-sat problems.
class SatCnfReader {
public:
SatCnfReader() : interpret_cnf_as_max_sat_(false) {}
// If called with true, then a cnf file will be converted to the max-sat
// problem: Try to minimize the number of unsatisfiable clauses.
void InterpretCnfAsMaxSat(bool v) { interpret_cnf_as_max_sat_ = v; }
// Loads the given cnf filename into the given proto.
bool Load(const std::string& filename, LinearBooleanProblem* problem) {
problem->Clear();
problem->set_name(ExtractProblemName(filename));
LinearBooleanProblemWrapper wrapper(problem);
return LoadInternal(filename, &wrapper);
}
bool Load(const std::string& filename, CpModelProto* problem) {
problem->Clear();
problem->set_name(ExtractProblemName(filename));
CpModelProtoWrapper wrapper(problem);
return LoadInternal(filename, &wrapper);
}
private:
template <class Problem>
bool LoadInternal(const std::string& filename, Problem* problem) {
positive_literal_to_weight_.clear();
objective_offset_ = 0;
is_wcnf_ = false;
end_marker_seen_ = false;
hard_weight_ = 0;
num_skipped_soft_clauses_ = 0;
num_singleton_soft_clauses_ = 0;
num_added_clauses_ = 0;
num_slack_variables_ = 0;
int num_lines = 0;
for (const std::string& line : FileLines(filename)) {
++num_lines;
ProcessNewLine(line, problem);
}
if (num_lines == 0) {
LOG(FATAL) << "File '" << filename << "' is empty or can't be read.";
}
problem->SetOriginalNumVariables(num_variables_);
problem->SetNumVariables(num_variables_ + num_slack_variables_);
// Fill the objective.
if (!positive_literal_to_weight_.empty()) {
for (const std::pair<int, int64> p : positive_literal_to_weight_) {
if (p.second != 0) {
problem->AddObjectiveTerm(p.first, p.second);
}
}
problem->SetObjectiveOffset(objective_offset_);
}
if (num_clauses_ != num_added_clauses_ + num_singleton_soft_clauses_ +
num_skipped_soft_clauses_) {
LOG(ERROR) << "Wrong number of clauses. " << num_clauses_ << " "
<< num_added_clauses_;
return false;
}
return true;
}
// Since the problem name is not stored in the cnf format, we infer it from
// the file name.
static std::string ExtractProblemName(const std::string& filename) {
const int found = filename.find_last_of('/');
const std::string problem_name =
found != std::string::npos ? filename.substr(found + 1) : filename;
return problem_name;
}
int64 StringPieceAtoi(absl::string_view input) {
int64 value;
// Hack: data() is not null terminated, but we do know that it points
// inside a string where numbers are separated by " " and since SimpleAtoi
// will stop at the first invalid char, this works.
CHECK(absl::SimpleAtoi(input, &value));
return value;
}
void ProcessHeader(const std::string& line) {
static const char kWordDelimiters[] = " ";
words_ = absl::StrSplit(line, kWordDelimiters, absl::SkipEmpty());
CHECK_EQ(words_[0], "p");
if (words_[1] == "cnf" || words_[1] == "wcnf") {
num_variables_ = StringPieceAtoi(words_[2]);
num_clauses_ = StringPieceAtoi(words_[3]);
if (words_[1] == "wcnf") {
is_wcnf_ = true;
hard_weight_ = (words_.size() > 4) ? StringPieceAtoi(words_[4]) : 0;
}
} else {
// TODO(user): The ToString() is only required for the open source. Fix.
LOG(FATAL) << "Unknown file type: " << words_[1];
}
}
template <class Problem>
void ProcessNewLine(const std::string& line, Problem* problem) {
if (line.empty() || end_marker_seen_) return;
if (line[0] == 'c') return;
if (line[0] == '%') {
end_marker_seen_ = true;
return;
}
if (line[0] == 'p') {
ProcessHeader(line);
return;
}
static const char kWordDelimiters[] = " ";
auto splitter = absl::StrSplit(line, kWordDelimiters, absl::SkipEmpty());
tmp_clause_.clear();
int64 weight = (!is_wcnf_ && interpret_cnf_as_max_sat_) ? 1 : hard_weight_;
bool first = true;
bool end_marker_seen = false;
for (const absl::string_view word : splitter) {
const int64 signed_value = StringPieceAtoi(word);
if (first && is_wcnf_) {
// Mathematically, a soft clause of weight 0 can be removed.
if (signed_value == 0) {
++num_skipped_soft_clauses_;
return;
}
weight = signed_value;
} else {
if (signed_value == 0) {
end_marker_seen = true;
break; // end of clause.
}
tmp_clause_.push_back(signed_value);
}
first = false;
}
if (!end_marker_seen) return;
if (weight == hard_weight_) {
++num_added_clauses_;
problem->AddConstraint(tmp_clause_);
} else {
if (tmp_clause_.size() == 1) {
// The max-sat formulation of an optimization sat problem with a
// linear objective introduces many singleton soft clauses. Because we
// natively work with a linear objective, we can just add the cost to
// the unique variable of such clause and remove the clause.
++num_singleton_soft_clauses_;
const int literal = -tmp_clause_[0];
if (literal > 0) {
positive_literal_to_weight_[literal] += weight;
} else {
positive_literal_to_weight_[-literal] -= weight;
objective_offset_ += weight;
}
} else {
// The +1 is because a positive literal is the same as the 1-based
// variable index.
const int slack_literal = num_variables_ + num_slack_variables_ + 1;
++num_slack_variables_;
tmp_clause_.push_back(slack_literal);
++num_added_clauses_;
problem->AddConstraint(tmp_clause_);
if (slack_literal > 0) {
positive_literal_to_weight_[slack_literal] += weight;
} else {
positive_literal_to_weight_[-slack_literal] -= weight;
objective_offset_ += weight;
}
if (absl::GetFlag(FLAGS_wcnf_use_strong_slack)) {
// Add the binary implications slack_literal true => all the other
// clause literals are false.
for (int i = 0; i + 1 < tmp_clause_.size(); ++i) {
problem->AddConstraint({-slack_literal, -tmp_clause_[i]});
}
}
}
}
}
bool interpret_cnf_as_max_sat_;
int num_clauses_;
int num_variables_;
// Temporary storage for ProcessNewLine().
std::vector<absl::string_view> words_;
// We stores the objective in a map because we want the variables to appear
// only once in the LinearObjective proto.
std::map<int, int64> positive_literal_to_weight_;
int64 objective_offset_;
// Used for the wcnf format.
bool is_wcnf_;
// Some files have text after %. This indicates if we have seen the '%'.
bool end_marker_seen_;
int64 hard_weight_;
int num_slack_variables_;
int num_skipped_soft_clauses_;
int num_singleton_soft_clauses_;
int num_added_clauses_;
std::vector<int> tmp_clause_;
DISALLOW_COPY_AND_ASSIGN(SatCnfReader);
};
} // namespace sat
} // namespace operations_research
#endif // OR_TOOLS_SAT_SAT_CNF_READER_H_