// Copyright 2010-2025 Google LLC // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #ifndef ORTOOLS_UTIL_FILE_UTIL_H_ #define ORTOOLS_UTIL_FILE_UTIL_H_ #include #include #include "absl/log/check.h" #include "absl/status/statusor.h" #include "absl/strings/string_view.h" #include "google/protobuf/message.h" #include "ortools/base/file.h" #include "ortools/base/options.h" #include "ortools/base/recordio.h" #include "ortools/base/status_macros.h" namespace operations_research { // Reads a file, optionally gzipped, to a string. absl::StatusOr ReadFileToString(absl::string_view filename); // Reads a proto from a file. Supports the following formats: binary, text, // JSON, all of those optionally gzipped. Returns errors as expected: filesystem // error, parsing errors, or type error: maybe it was a valid JSON, text proto, // or binary proto, but not of the right proto message (this is not an exact // science, but the heuristics used should work well in practice). absl::Status ReadFileToProto( absl::string_view filename, google::protobuf::Message* proto, // If true, unset required fields don't cause errors. This // boolean doesn't work for JSON inputs. bool allow_partial = false); // Exactly like ReadFileToProto(), but directly from the contents. absl::Status StringToProto(absl::string_view data, google::protobuf::Message* proto, bool allow_partial = false); template absl::StatusOr ReadFileToProto(absl::string_view filename, bool allow_partial = false) { Proto proto; RETURN_IF_ERROR(ReadFileToProto(filename, &proto, allow_partial)) << "filename=" << filename; return proto; } // Specifies how the proto should be formatted when writing it to a file. // kCanonicalJson converts field names to lower camel-case. enum class ProtoWriteFormat { kProtoText, kProtoBinary, kJson, kCanonicalJson }; // Writes a proto to a file. Supports the following formats: binary, text, JSON, // all of those optionally gzipped. // If 'proto_write_format' is kProtoBinary, ".bin" is appended to file_name. If // 'proto_write_format' is kJson or kCanonicalJson, ".json" is appended to // file_name. If 'gzipped' is true, ".gz" is appended to file_name. absl::Status WriteProtoToFile(absl::string_view filename, const google::protobuf::Message& proto, ProtoWriteFormat proto_write_format, bool gzipped = false, bool append_extension_to_file_name = true); namespace internal { // General method to read expected_num_records from a file. If // expected_num_records is -1, then reads all records from the file. If not, // dies if the file doesn't contain exactly expected_num_records. template std::vector ReadNumRecords(File* file, int expected_num_records) { recordio::RecordReader reader(file); std::vector protos; Proto proto; int num_read = 0; while (num_read != expected_num_records && reader.ReadProtocolMessage(&proto)) { protos.push_back(proto); ++num_read; } CHECK(reader.Close()) << "File '" << file->filename() << "'was not fully read, or something went wrong when closing " "it. Is it the right format? (RecordIO of Protocol Buffers)."; if (expected_num_records >= 0) { CHECK_EQ(num_read, expected_num_records) << "There were less than the expected " << expected_num_records << " in the file."; } return protos; } // Ditto, taking a filename as argument. template std::vector ReadNumRecords(absl::string_view filename, int expected_num_records) { return ReadNumRecords(file::OpenOrDie(filename, "r", file::Defaults()), expected_num_records); } } // namespace internal // Reads all records in Proto format in 'file'. Silently does nothing if the // file is empty. Dies if the file doesn't exist or contains something else than // protos encoded in RecordIO format. template std::vector ReadAllRecordsOrDie(absl::string_view filename) { return internal::ReadNumRecords(filename, -1); } template std::vector ReadAllRecordsOrDie(File* file) { return internal::ReadNumRecords(file, -1); } // Reads one record from file, which must be in RecordIO binary proto format. // Dies if the file can't be read, doesn't contain exactly one record, or // contains something else than the expected proto in RecordIO format. template Proto ReadOneRecordOrDie(absl::string_view filename) { Proto p; p.Swap(&internal::ReadNumRecords(filename, 1)[0]); return p; } // Writes all records in Proto format to 'file'. Dies if it is unable to open // the file or write to it. template void WriteRecordsOrDie(absl::string_view filename, const std::vector& protos) { recordio::RecordWriter writer( file::OpenOrDie(filename, "w", file::Defaults())); for (const Proto& proto : protos) { CHECK(writer.WriteProtocolMessage(proto)); } CHECK(writer.Close()); } } // namespace operations_research #endif // ORTOOLS_UTIL_FILE_UTIL_H_