blob: 5671a3faf9e0abc3c5521e3e1fc9a77615f69c0c [file] [log] [blame]
Austin Schuhb06f03b2021-02-17 22:00:37 -08001#include "aos/events/logging/log_writer.h"
2
Austin Schuh6bb8a822021-03-31 23:04:39 -07003#include <dirent.h>
4
Austin Schuhb06f03b2021-02-17 22:00:37 -08005#include <functional>
6#include <map>
7#include <vector>
8
9#include "aos/configuration.h"
10#include "aos/events/event_loop.h"
11#include "aos/network/message_bridge_server_generated.h"
12#include "aos/network/team_number.h"
Austin Schuh61e973f2021-02-21 21:43:56 -080013#include "aos/network/timestamp_channel.h"
Austin Schuhb06f03b2021-02-17 22:00:37 -080014
15namespace aos {
16namespace logger {
17namespace {
18using message_bridge::RemoteMessage;
Austin Schuhbd06ae42021-03-31 22:48:21 -070019namespace chrono = std::chrono;
Austin Schuhb06f03b2021-02-17 22:00:37 -080020} // namespace
21
22Logger::Logger(EventLoop *event_loop, const Configuration *configuration,
23 std::function<bool(const Channel *)> should_log)
24 : event_loop_(event_loop),
25 configuration_(configuration),
Austin Schuh5b728b72021-06-16 14:57:15 -070026 node_(configuration::GetNode(configuration_, event_loop->node())),
27 node_index_(configuration::GetNodeIndex(configuration_, node_)),
Austin Schuhb06f03b2021-02-17 22:00:37 -080028 name_(network::GetHostname()),
29 timer_handler_(event_loop_->AddTimer(
Austin Schuh30586902021-03-30 22:54:08 -070030 [this]() { DoLogData(event_loop_->monotonic_now(), true); })),
Austin Schuhb06f03b2021-02-17 22:00:37 -080031 server_statistics_fetcher_(
32 configuration::MultiNode(event_loop_->configuration())
33 ? event_loop_->MakeFetcher<message_bridge::ServerStatistics>(
34 "/aos")
35 : aos::Fetcher<message_bridge::ServerStatistics>()) {
Austin Schuh58646e22021-08-23 23:51:46 -070036 timer_handler_->set_name("channel_poll");
Austin Schuh5b728b72021-06-16 14:57:15 -070037 VLOG(1) << "Creating logger for " << FlatbufferToJson(node_);
Austin Schuhb06f03b2021-02-17 22:00:37 -080038
Naman Gupta41d70c22022-11-21 15:29:52 -080039 // When we are logging remote timestamps, we need to be able to translate
40 // from the channel index that the event loop uses to the channel index in
41 // the config in the log file.
Austin Schuh01f3b392022-01-25 20:03:09 -080042 event_loop_to_logged_channel_index_.resize(
43 event_loop->configuration()->channels()->size(), -1);
44 for (size_t event_loop_channel_index = 0;
45 event_loop_channel_index <
46 event_loop->configuration()->channels()->size();
47 ++event_loop_channel_index) {
48 const Channel *event_loop_channel =
49 event_loop->configuration()->channels()->Get(event_loop_channel_index);
50
51 const Channel *logged_channel = aos::configuration::GetChannel(
52 configuration_, event_loop_channel->name()->string_view(),
53 event_loop_channel->type()->string_view(), "", node_);
54
55 if (logged_channel != nullptr) {
56 event_loop_to_logged_channel_index_[event_loop_channel_index] =
57 configuration::ChannelIndex(configuration_, logged_channel);
58 }
59 }
60
61 // Map to match source channels with the timestamp logger, if the contents
62 // should be reliable, and a list of all channels logged on it to be treated
63 // as reliable.
64 std::map<const Channel *, std::tuple<const Node *, bool, std::vector<bool>>>
65 timestamp_logger_channels;
Austin Schuhb06f03b2021-02-17 22:00:37 -080066
Austin Schuh61e973f2021-02-21 21:43:56 -080067 message_bridge::ChannelTimestampFinder finder(event_loop_);
68 for (const Channel *channel : *event_loop_->configuration()->channels()) {
69 if (!configuration::ChannelIsSendableOnNode(channel, event_loop_->node())) {
Austin Schuhb06f03b2021-02-17 22:00:37 -080070 continue;
71 }
Austin Schuh61e973f2021-02-21 21:43:56 -080072 if (!channel->has_destination_nodes()) {
73 continue;
74 }
Austin Schuh01f3b392022-01-25 20:03:09 -080075 const size_t channel_index =
76 configuration::ChannelIndex(event_loop_->configuration(), channel);
77
Austin Schuh61e973f2021-02-21 21:43:56 -080078 for (const Connection *connection : *channel->destination_nodes()) {
79 if (configuration::ConnectionDeliveryTimeIsLoggedOnNode(
80 connection, event_loop_->node())) {
81 const Node *other_node = configuration::GetNode(
Austin Schuh5b728b72021-06-16 14:57:15 -070082 configuration_, connection->name()->string_view());
Austin Schuh61e973f2021-02-21 21:43:56 -080083
84 VLOG(1) << "Timestamps are logged from "
85 << FlatbufferToJson(other_node);
Austin Schuh01f3b392022-01-25 20:03:09 -080086 // True if each channel's remote timestamps are split into a separate
87 // RemoteMessage channel.
88 const bool is_split =
89 finder.SplitChannelForChannel(channel, connection) != nullptr;
90
91 const Channel *const timestamp_logger_channel =
92 finder.ForChannel(channel, connection);
93
94 auto it = timestamp_logger_channels.find(timestamp_logger_channel);
95 if (it != timestamp_logger_channels.end()) {
96 CHECK(!is_split);
97 CHECK_LT(channel_index, std::get<2>(it->second).size());
Brian Smartt796cca02022-04-12 15:07:21 -070098 std::get<2>(it->second)[channel_index] =
99 (connection->time_to_live() == 0);
Austin Schuh01f3b392022-01-25 20:03:09 -0800100 } else {
101 if (is_split) {
102 timestamp_logger_channels.insert(std::make_pair(
103 timestamp_logger_channel,
104 std::make_tuple(other_node, (connection->time_to_live() == 0),
105 std::vector<bool>())));
106 } else {
107 std::vector<bool> channel_reliable_contents(
108 event_loop->configuration()->channels()->size(), false);
109 channel_reliable_contents[channel_index] =
110 (connection->time_to_live() == 0);
111
112 timestamp_logger_channels.insert(std::make_pair(
113 timestamp_logger_channel,
114 std::make_tuple(other_node, false,
115 std::move(channel_reliable_contents))));
116 }
117 }
Austin Schuh61e973f2021-02-21 21:43:56 -0800118 }
119 }
Austin Schuhb06f03b2021-02-17 22:00:37 -0800120 }
121
Austin Schuhb06f03b2021-02-17 22:00:37 -0800122 for (size_t channel_index = 0;
123 channel_index < configuration_->channels()->size(); ++channel_index) {
124 const Channel *const config_channel =
125 configuration_->channels()->Get(channel_index);
126 // The MakeRawFetcher method needs a channel which is in the event loop
127 // configuration() object, not the configuration_ object. Go look that up
128 // from the config.
129 const Channel *channel = aos::configuration::GetChannel(
130 event_loop_->configuration(), config_channel->name()->string_view(),
131 config_channel->type()->string_view(), "", event_loop_->node());
132 CHECK(channel != nullptr)
133 << ": Failed to look up channel "
134 << aos::configuration::CleanedChannelToString(config_channel);
Austin Schuh5b728b72021-06-16 14:57:15 -0700135 if (!should_log(config_channel)) {
Austin Schuhb06f03b2021-02-17 22:00:37 -0800136 continue;
137 }
138
139 FetcherStruct fs;
140 fs.channel_index = channel_index;
141 fs.channel = channel;
142
143 const bool is_local =
Austin Schuh5b728b72021-06-16 14:57:15 -0700144 configuration::ChannelIsSendableOnNode(config_channel, node_);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800145
146 const bool is_readable =
Austin Schuh5b728b72021-06-16 14:57:15 -0700147 configuration::ChannelIsReadableOnNode(config_channel, node_);
Austin Schuh01f3b392022-01-25 20:03:09 -0800148 const bool is_logged =
149 configuration::ChannelMessageIsLoggedOnNode(config_channel, node_);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800150 const bool log_message = is_logged && is_readable;
151
152 bool log_delivery_times = false;
Austin Schuh5b728b72021-06-16 14:57:15 -0700153 if (configuration::MultiNode(configuration_)) {
Austin Schuh72211ae2021-08-05 14:02:30 -0700154 const aos::Connection *connection =
Austin Schuh5b728b72021-06-16 14:57:15 -0700155 configuration::ConnectionToNode(config_channel, node_);
Austin Schuh72211ae2021-08-05 14:02:30 -0700156
Austin Schuhb06f03b2021-02-17 22:00:37 -0800157 log_delivery_times = configuration::ConnectionDeliveryTimeIsLoggedOnNode(
Austin Schuh72211ae2021-08-05 14:02:30 -0700158 connection, event_loop_->node());
159
160 CHECK_EQ(log_delivery_times,
161 configuration::ConnectionDeliveryTimeIsLoggedOnNode(
Austin Schuh5b728b72021-06-16 14:57:15 -0700162 config_channel, node_, node_));
Austin Schuh72211ae2021-08-05 14:02:30 -0700163
164 if (connection) {
165 fs.reliable_forwarding = (connection->time_to_live() == 0);
166 }
Austin Schuhb06f03b2021-02-17 22:00:37 -0800167 }
168
Austin Schuh01f3b392022-01-25 20:03:09 -0800169 // Now, detect a RemoteMessage timestamp logger where we should just log
170 // the contents to a file directly.
Austin Schuhb06f03b2021-02-17 22:00:37 -0800171 const bool log_contents = timestamp_logger_channels.find(channel) !=
172 timestamp_logger_channels.end();
173
174 if (log_message || log_delivery_times || log_contents) {
175 fs.fetcher = event_loop->MakeRawFetcher(channel);
176 VLOG(1) << "Logging channel "
177 << configuration::CleanedChannelToString(channel);
178
179 if (log_delivery_times) {
180 VLOG(1) << " Delivery times";
181 fs.wants_timestamp_writer = true;
Austin Schuh5b728b72021-06-16 14:57:15 -0700182 fs.timestamp_node_index = static_cast<int>(node_index_);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800183 }
Austin Schuhe46492f2021-07-31 19:49:41 -0700184 // Both the timestamp and data writers want data_node_index so it knows
185 // what the source node is.
186 if (log_message || log_delivery_times) {
Austin Schuhb06f03b2021-02-17 22:00:37 -0800187 if (!is_local) {
188 const Node *source_node = configuration::GetNode(
189 configuration_, channel->source_node()->string_view());
190 fs.data_node_index =
191 configuration::GetNodeIndex(configuration_, source_node);
Austin Schuhe46492f2021-07-31 19:49:41 -0700192 }
193 }
194 if (log_message) {
195 VLOG(1) << " Data";
196 fs.wants_writer = true;
197 if (!is_local) {
Austin Schuhb06f03b2021-02-17 22:00:37 -0800198 fs.log_type = LogType::kLogRemoteMessage;
199 } else {
Austin Schuh5b728b72021-06-16 14:57:15 -0700200 fs.data_node_index = static_cast<int>(node_index_);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800201 }
202 }
203 if (log_contents) {
204 VLOG(1) << "Timestamp logger channel "
205 << configuration::CleanedChannelToString(channel);
Austin Schuh01f3b392022-01-25 20:03:09 -0800206 auto timestamp_logger_channel_info =
207 timestamp_logger_channels.find(channel);
208 CHECK(timestamp_logger_channel_info != timestamp_logger_channels.end());
209 fs.timestamp_node = std::get<0>(timestamp_logger_channel_info->second);
210 fs.reliable_contents =
211 std::get<1>(timestamp_logger_channel_info->second);
212 fs.channel_reliable_contents =
213 std::get<2>(timestamp_logger_channel_info->second);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800214 fs.wants_contents_writer = true;
215 fs.contents_node_index =
216 configuration::GetNodeIndex(configuration_, fs.timestamp_node);
217 }
218 fetchers_.emplace_back(std::move(fs));
219 }
220 }
Austin Schuhb06f03b2021-02-17 22:00:37 -0800221}
222
223Logger::~Logger() {
224 if (log_namer_) {
225 // If we are replaying a log file, or in simulation, we want to force the
226 // last bit of data to be logged. The easiest way to deal with this is to
Austin Schuh01f3b392022-01-25 20:03:09 -0800227 // poll everything as we go to destroy the class, ie, shut down the
228 // logger, and write it to disk.
Austin Schuhb06f03b2021-02-17 22:00:37 -0800229 StopLogging(event_loop_->monotonic_now());
230 }
231}
232
Austin Schuh6bb8a822021-03-31 23:04:39 -0700233bool Logger::RenameLogBase(std::string new_base_name) {
Naman Gupta41d70c22022-11-21 15:29:52 -0800234 // TODO(Naman): Got a crash in RenameLogBase. Putting in a CHECK_NOTNULL to
235 // catch the bug if it happens again
236 if (new_base_name == CHECK_NOTNULL(log_namer_)->base_name()) {
Austin Schuh6bb8a822021-03-31 23:04:39 -0700237 return true;
238 }
239 std::string current_directory = std::string(log_namer_->base_name());
240 std::string new_directory = new_base_name;
241
242 auto current_path_split = current_directory.rfind("/");
Naman Gupta41d70c22022-11-21 15:29:52 -0800243 CHECK(current_path_split != std::string::npos)
244 << "Could not find / in the current directory path";
Austin Schuh6bb8a822021-03-31 23:04:39 -0700245 auto new_path_split = new_directory.rfind("/");
Naman Gupta41d70c22022-11-21 15:29:52 -0800246 CHECK(new_path_split != std::string::npos)
247 << "Could not find / in the new directory path";
Austin Schuh6bb8a822021-03-31 23:04:39 -0700248
249 CHECK(new_base_name.substr(new_path_split) ==
250 current_directory.substr(current_path_split))
251 << "Rename of file base from " << current_directory << " to "
252 << new_directory << " is not supported.";
253
254 current_directory.resize(current_path_split);
255 new_directory.resize(new_path_split);
256 DIR *dir = opendir(current_directory.c_str());
257 if (dir) {
258 closedir(dir);
259 const int result = rename(current_directory.c_str(), new_directory.c_str());
260 if (result != 0) {
261 PLOG(ERROR) << "Unable to rename " << current_directory << " to "
262 << new_directory;
263 return false;
264 }
265 } else {
266 // Handle if directory was already renamed.
267 dir = opendir(new_directory.c_str());
268 if (!dir) {
269 LOG(ERROR) << "Old directory " << current_directory
270 << " missing and new directory " << new_directory
271 << " not present.";
272 return false;
273 }
274 closedir(dir);
275 }
276
277 log_namer_->set_base_name(new_base_name);
278 Rotate();
279 return true;
280}
281
Brian Smartt796cca02022-04-12 15:07:21 -0700282std::string Logger::WriteConfiguration(LogNamer *log_namer) {
Austin Schuhb06f03b2021-02-17 22:00:37 -0800283 std::string config_sha256;
Brian Smartt03c00da2022-02-24 10:25:00 -0800284
Austin Schuhb06f03b2021-02-17 22:00:37 -0800285 if (separate_config_) {
286 flatbuffers::FlatBufferBuilder fbb;
287 flatbuffers::Offset<aos::Configuration> configuration_offset =
288 CopyFlatBuffer(configuration_, &fbb);
289 LogFileHeader::Builder log_file_header_builder(fbb);
290 log_file_header_builder.add_configuration(configuration_offset);
291 fbb.FinishSizePrefixed(log_file_header_builder.Finish());
292 aos::SizePrefixedFlatbufferDetachedBuffer<LogFileHeader> config_header(
293 fbb.Release());
294 config_sha256 = Sha256(config_header.span());
295 LOG(INFO) << "Config sha256 of " << config_sha256;
Brian Smartt03c00da2022-02-24 10:25:00 -0800296 log_namer->WriteConfiguration(&config_header, config_sha256);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800297 }
298
Brian Smartt03c00da2022-02-24 10:25:00 -0800299 return config_sha256;
300}
301
302void Logger::StartLogging(std::unique_ptr<LogNamer> log_namer,
303 std::optional<UUID> log_start_uuid) {
304 CHECK(!log_namer_) << ": Already logging";
305
306 VLOG(1) << "Starting logger for " << FlatbufferToJson(node_);
307
308 auto config_sha256 = WriteConfiguration(log_namer.get());
309
310 log_namer_ = std::move(log_namer);
311
Austin Schuhb06f03b2021-02-17 22:00:37 -0800312 log_event_uuid_ = UUID::Random();
313 log_start_uuid_ = log_start_uuid;
Austin Schuhb06f03b2021-02-17 22:00:37 -0800314
315 // We want to do as much work as possible before the initial Fetch. Time
316 // between that and actually starting to log opens up the possibility of
317 // falling off the end of the queue during that time.
318
319 for (FetcherStruct &f : fetchers_) {
320 if (f.wants_writer) {
321 f.writer = log_namer_->MakeWriter(f.channel);
322 }
323 if (f.wants_timestamp_writer) {
324 f.timestamp_writer = log_namer_->MakeTimestampWriter(f.channel);
325 }
326 if (f.wants_contents_writer) {
327 f.contents_writer = log_namer_->MakeForwardedTimestampWriter(
328 f.channel, CHECK_NOTNULL(f.timestamp_node));
329 }
330 }
331
Austin Schuh73340842021-07-30 22:32:06 -0700332 log_namer_->SetHeaderTemplate(MakeHeader(config_sha256));
Austin Schuhb06f03b2021-02-17 22:00:37 -0800333
Austin Schuha42ee962021-03-31 22:49:30 -0700334 const aos::monotonic_clock::time_point beginning_time =
335 event_loop_->monotonic_now();
336
Austin Schuhb06f03b2021-02-17 22:00:37 -0800337 // Grab data from each channel right before we declare the log file started
338 // so we can capture the latest message on each channel. This lets us have
339 // non periodic messages with configuration that now get logged.
340 for (FetcherStruct &f : fetchers_) {
341 const auto start = event_loop_->monotonic_now();
342 const bool got_new = f.fetcher->Fetch();
343 const auto end = event_loop_->monotonic_now();
344 RecordFetchResult(start, end, got_new, &f);
345
346 // If there is a message, we want to write it.
347 f.written = f.fetcher->context().data == nullptr;
348 }
349
350 // Clear out any old timestamps in case we are re-starting logging.
Austin Schuh572924a2021-07-30 22:32:12 -0700351 for (size_t i = 0; i < configuration::NodesCount(configuration_); ++i) {
Austin Schuh58646e22021-08-23 23:51:46 -0700352 log_namer_->ClearStartTimes();
Austin Schuhb06f03b2021-02-17 22:00:37 -0800353 }
354
Austin Schuha42ee962021-03-31 22:49:30 -0700355 const aos::monotonic_clock::time_point fetch_time =
356 event_loop_->monotonic_now();
Austin Schuhb06f03b2021-02-17 22:00:37 -0800357 WriteHeader();
Austin Schuha42ee962021-03-31 22:49:30 -0700358 const aos::monotonic_clock::time_point header_time =
359 event_loop_->monotonic_now();
Austin Schuhb06f03b2021-02-17 22:00:37 -0800360
Brian Smartt796cca02022-04-12 15:07:21 -0700361 VLOG(1) << "Logging node as " << FlatbufferToJson(node_) << " start_time "
362 << last_synchronized_time_ << ", took "
Brian Smartt03c00da2022-02-24 10:25:00 -0800363 << chrono::duration<double>(fetch_time - beginning_time).count()
364 << " to fetch, "
365 << chrono::duration<double>(header_time - fetch_time).count()
366 << " to write headers, boot uuid " << event_loop_->boot_uuid();
Austin Schuhb06f03b2021-02-17 22:00:37 -0800367
368 // Force logging up until the start of the log file now, so the messages at
369 // the start are always ordered before the rest of the messages.
370 // Note: this ship may have already sailed, but we don't have to make it
371 // worse.
372 // TODO(austin): Test...
Austin Schuh855f8932021-03-19 22:01:32 -0700373 //
Naman Gupta41d70c22022-11-21 15:29:52 -0800374 // This is safe to call here since we have set last_synchronized_time_ as
375 // the same time as in the header, and all the data before it should be
376 // logged without ordering concerns.
Austin Schuhb06f03b2021-02-17 22:00:37 -0800377 LogUntil(last_synchronized_time_);
378
379 timer_handler_->Setup(event_loop_->monotonic_now() + polling_period_,
380 polling_period_);
381}
382
Brian Smartt796cca02022-04-12 15:07:21 -0700383std::unique_ptr<LogNamer> Logger::RestartLogging(
384 std::unique_ptr<LogNamer> log_namer, std::optional<UUID> log_start_uuid) {
Brian Smartt03c00da2022-02-24 10:25:00 -0800385 CHECK(log_namer_) << ": Unexpected restart while not logging";
386
387 VLOG(1) << "Restarting logger for " << FlatbufferToJson(node_);
388
389 // Force out every currently pending message, pointing all fetchers at the
390 // last (currently available) records. Note that LogUntil() updates
391 // last_synchronized_time_ to the time value that it receives.
Brian Smartt796cca02022-04-12 15:07:21 -0700392 while (LogUntil(last_synchronized_time_ + polling_period_))
393 ;
Brian Smartt03c00da2022-02-24 10:25:00 -0800394
395 std::unique_ptr<LogNamer> old_log_namer = std::move(log_namer_);
396 log_namer_ = std::move(log_namer);
397
Naman Gupta41d70c22022-11-21 15:29:52 -0800398 // Now grab a representative time on both the RT and monotonic clock.
399 // Average a monotonic clock before and after to reduce the error.
Brian Smartt03c00da2022-02-24 10:25:00 -0800400 const aos::monotonic_clock::time_point beginning_time =
401 event_loop_->monotonic_now();
Austin Schuh41f8df92022-04-15 11:45:52 -0700402 const aos::realtime_clock::time_point beginning_time_rt =
403 event_loop_->realtime_now();
404 const aos::monotonic_clock::time_point beginning_time2 =
405 event_loop_->monotonic_now();
406
407 if (beginning_time > last_synchronized_time_) {
408 LOG(WARNING) << "Took over " << polling_period_.count()
409 << "ns to swap log_namer";
410 }
411
Naman Gupta41d70c22022-11-21 15:29:52 -0800412 // Since we are going to log all in 1 big go, we need our log start time to
413 // be after the previous LogUntil call finished, but before 1 period after
414 // it. The best way to guarentee that is to pick a start time that is the
415 // earliest of the two. That covers the case where the OS puts us to sleep
416 // between when we finish LogUntil and capture beginning_time.
Austin Schuh41f8df92022-04-15 11:45:52 -0700417 const aos::monotonic_clock::time_point monotonic_start_time =
418 std::min(last_synchronized_time_, beginning_time);
419 const aos::realtime_clock::time_point realtime_start_time =
420 (beginning_time_rt + (monotonic_start_time.time_since_epoch() -
421 ((beginning_time.time_since_epoch() +
422 beginning_time2.time_since_epoch()) /
423 2)));
Brian Smartt03c00da2022-02-24 10:25:00 -0800424
425 auto config_sha256 = WriteConfiguration(log_namer_.get());
426
427 log_event_uuid_ = UUID::Random();
428 log_start_uuid_ = log_start_uuid;
429
430 log_namer_->SetHeaderTemplate(MakeHeader(config_sha256));
431
432 // Note that WriteHeader updates last_synchronized_time_ to be the
433 // current time when it is called, which is then the "start time"
434 // of the new (restarted) log. This timestamp will be after
Naman Gupta41d70c22022-11-21 15:29:52 -0800435 // the timestamp of the last message fetched on each channel, but is
436 // carefully picked per the comment above to not violate
437 // max_out_of_order_duration.
Austin Schuh41f8df92022-04-15 11:45:52 -0700438 WriteHeader(monotonic_start_time, realtime_start_time);
Brian Smartt03c00da2022-02-24 10:25:00 -0800439
440 const aos::monotonic_clock::time_point header_time =
441 event_loop_->monotonic_now();
442
443 // Write the transition record(s) for each channel ...
444 for (FetcherStruct &f : fetchers_) {
Brian Smartt03c00da2022-02-24 10:25:00 -0800445 // Create writers from the new namer
446 NewDataWriter *next_writer = nullptr;
447 NewDataWriter *next_timestamp_writer = nullptr;
448 NewDataWriter *next_contents_writer = nullptr;
449
450 if (f.wants_writer) {
451 next_writer = log_namer_->MakeWriter(f.channel);
452 }
453 if (f.wants_timestamp_writer) {
454 next_timestamp_writer = log_namer_->MakeTimestampWriter(f.channel);
455 }
456 if (f.wants_contents_writer) {
457 next_contents_writer = log_namer_->MakeForwardedTimestampWriter(
458 f.channel, CHECK_NOTNULL(f.timestamp_node));
459 }
460
461 if (f.fetcher->context().data != nullptr) {
Brian Smartt796cca02022-04-12 15:07:21 -0700462 // Write the last message fetched as the first of the new log of this
463 // type. The timestamps on these will all be before the new start time.
Brian Smartt03c00da2022-02-24 10:25:00 -0800464 WriteData(next_writer, f);
465 WriteTimestamps(next_timestamp_writer, f);
466 WriteContent(next_contents_writer, f);
467
Brian Smartt796cca02022-04-12 15:07:21 -0700468 // It is possible that a few more snuck in. Write them all out also,
469 // including any that should also be in the old log.
Brian Smartt03c00da2022-02-24 10:25:00 -0800470 while (true) {
Brian Smartt796cca02022-04-12 15:07:21 -0700471 // Get the next message ...
472 const auto start = event_loop_->monotonic_now();
473 const bool got_new = f.fetcher->FetchNext();
474 const auto end = event_loop_->monotonic_now();
475 RecordFetchResult(start, end, got_new, &f);
Brian Smartt03c00da2022-02-24 10:25:00 -0800476
Brian Smartt796cca02022-04-12 15:07:21 -0700477 if (got_new) {
478 if (f.fetcher->context().monotonic_event_time <=
479 last_synchronized_time_) {
480 WriteFetchedRecord(f);
Brian Smartt03c00da2022-02-24 10:25:00 -0800481 WriteData(next_writer, f);
482 WriteTimestamps(next_timestamp_writer, f);
483 WriteContent(next_contents_writer, f);
484
Brian Smartt03c00da2022-02-24 10:25:00 -0800485 } else {
Brian Smartt796cca02022-04-12 15:07:21 -0700486 f.written = false;
Brian Smartt03c00da2022-02-24 10:25:00 -0800487 break;
488 }
Brian Smartt796cca02022-04-12 15:07:21 -0700489
490 } else {
491 f.written = true;
492 break;
493 }
Brian Smartt03c00da2022-02-24 10:25:00 -0800494 }
495 }
496
497 // Switch fully over to the new writers.
498 f.writer = next_writer;
499 f.timestamp_writer = next_timestamp_writer;
500 f.contents_writer = next_contents_writer;
Brian Smartt03c00da2022-02-24 10:25:00 -0800501 }
502
503 const aos::monotonic_clock::time_point channel_time =
504 event_loop_->monotonic_now();
505
Brian Smartt796cca02022-04-12 15:07:21 -0700506 VLOG(1) << "Logging node as " << FlatbufferToJson(node_) << " restart_time "
507 << last_synchronized_time_ << ", took "
Brian Smartt03c00da2022-02-24 10:25:00 -0800508 << chrono::duration<double>(header_time - beginning_time).count()
509 << " to prepare and write header, "
510 << chrono::duration<double>(channel_time - header_time).count()
Brian Smartt796cca02022-04-12 15:07:21 -0700511 << " to write initial channel messages, boot uuid "
512 << event_loop_->boot_uuid();
Brian Smartt03c00da2022-02-24 10:25:00 -0800513
514 return old_log_namer;
515}
516
Austin Schuhb06f03b2021-02-17 22:00:37 -0800517std::unique_ptr<LogNamer> Logger::StopLogging(
518 aos::monotonic_clock::time_point end_time) {
519 CHECK(log_namer_) << ": Not logging right now";
520
521 if (end_time != aos::monotonic_clock::min_time) {
Austin Schuh30586902021-03-30 22:54:08 -0700522 // Folks like to use the on_logged_period_ callback to trigger stop and
523 // start events. We can't have those then recurse and try to stop again.
524 // Rather than making everything reentrant, let's just instead block the
525 // callback here.
526 DoLogData(end_time, false);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800527 }
528 timer_handler_->Disable();
529
530 for (FetcherStruct &f : fetchers_) {
531 f.writer = nullptr;
532 f.timestamp_writer = nullptr;
533 f.contents_writer = nullptr;
534 }
Austin Schuhb06f03b2021-02-17 22:00:37 -0800535
536 log_event_uuid_ = UUID::Zero();
Austin Schuh34f9e482021-03-31 22:54:18 -0700537 log_start_uuid_ = std::nullopt;
Austin Schuhb06f03b2021-02-17 22:00:37 -0800538
539 return std::move(log_namer_);
540}
541
Austin Schuh41f8df92022-04-15 11:45:52 -0700542void Logger::WriteHeader(aos::monotonic_clock::time_point monotonic_start_time,
543 aos::realtime_clock::time_point realtime_start_time) {
Austin Schuhb06f03b2021-02-17 22:00:37 -0800544 if (configuration::MultiNode(configuration_)) {
545 server_statistics_fetcher_.Fetch();
546 }
547
Austin Schuh41f8df92022-04-15 11:45:52 -0700548 if (monotonic_start_time == aos::monotonic_clock::min_time) {
549 monotonic_start_time = event_loop_->monotonic_now();
550 realtime_start_time = event_loop_->realtime_now();
551 }
Austin Schuhb06f03b2021-02-17 22:00:37 -0800552
553 // We need to pick a point in time to declare the log file "started". This
554 // starts here. It needs to be after everything is fetched so that the
555 // fetchers are all pointed at the most recent message before the start
556 // time.
557 last_synchronized_time_ = monotonic_start_time;
558
559 for (const Node *node : log_namer_->nodes()) {
560 const int node_index = configuration::GetNodeIndex(configuration_, node);
561 MaybeUpdateTimestamp(node, node_index, monotonic_start_time,
562 realtime_start_time);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800563 }
564}
565
Austin Schuhb06f03b2021-02-17 22:00:37 -0800566void Logger::WriteMissingTimestamps() {
567 if (configuration::MultiNode(configuration_)) {
568 server_statistics_fetcher_.Fetch();
569 } else {
570 return;
571 }
572
573 if (server_statistics_fetcher_.get() == nullptr) {
574 return;
575 }
576
577 for (const Node *node : log_namer_->nodes()) {
578 const int node_index = configuration::GetNodeIndex(configuration_, node);
579 if (MaybeUpdateTimestamp(
580 node, node_index,
581 server_statistics_fetcher_.context().monotonic_event_time,
582 server_statistics_fetcher_.context().realtime_event_time)) {
Austin Schuh58646e22021-08-23 23:51:46 -0700583 VLOG(1) << "Timestamps changed on " << aos::FlatbufferToJson(node);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800584 }
585 }
586}
587
Austin Schuhb06f03b2021-02-17 22:00:37 -0800588bool Logger::MaybeUpdateTimestamp(
589 const Node *node, int node_index,
590 aos::monotonic_clock::time_point monotonic_start_time,
591 aos::realtime_clock::time_point realtime_start_time) {
592 // Bail early if the start times are already set.
Austin Schuh58646e22021-08-23 23:51:46 -0700593 if (node_ == node || !configuration::MultiNode(configuration_)) {
594 if (log_namer_->monotonic_start_time(node_index,
595 event_loop_->boot_uuid()) !=
596 monotonic_clock::min_time) {
597 return false;
598 }
Brian Smartt03c00da2022-02-24 10:25:00 -0800599
Austin Schuhb06f03b2021-02-17 22:00:37 -0800600 // There are no offsets to compute for ourself, so always succeed.
Austin Schuh58646e22021-08-23 23:51:46 -0700601 log_namer_->SetStartTimes(node_index, event_loop_->boot_uuid(),
602 monotonic_start_time, realtime_start_time,
603 monotonic_start_time, realtime_start_time);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800604 return true;
605 } else if (server_statistics_fetcher_.get() != nullptr) {
606 // We must be a remote node now. Look for the connection and see if it is
607 // connected.
James Kuszmaul17607fb2021-10-15 20:00:32 -0700608 CHECK(server_statistics_fetcher_->has_connections());
Austin Schuhb06f03b2021-02-17 22:00:37 -0800609
610 for (const message_bridge::ServerConnection *connection :
611 *server_statistics_fetcher_->connections()) {
612 if (connection->node()->name()->string_view() !=
613 node->name()->string_view()) {
614 continue;
615 }
616
617 if (connection->state() != message_bridge::State::CONNECTED) {
618 VLOG(1) << node->name()->string_view()
619 << " is not connected, can't start it yet.";
620 break;
621 }
622
Austin Schuhb06f03b2021-02-17 22:00:37 -0800623 if (!connection->has_monotonic_offset()) {
624 VLOG(1) << "Missing monotonic offset for setting start time for node "
625 << aos::FlatbufferToJson(node);
626 break;
627 }
628
James Kuszmaul17607fb2021-10-15 20:00:32 -0700629 CHECK(connection->has_boot_uuid());
Austin Schuh58646e22021-08-23 23:51:46 -0700630 const UUID boot_uuid =
631 UUID::FromString(connection->boot_uuid()->string_view());
632
633 if (log_namer_->monotonic_start_time(node_index, boot_uuid) !=
634 monotonic_clock::min_time) {
635 break;
636 }
637
638 VLOG(1) << "Updating start time for "
639 << aos::FlatbufferToJson(connection);
640
Austin Schuhb06f03b2021-02-17 22:00:37 -0800641 // Found it and it is connected. Compensate and go.
Austin Schuh73340842021-07-30 22:32:06 -0700642 log_namer_->SetStartTimes(
Austin Schuh58646e22021-08-23 23:51:46 -0700643 node_index, boot_uuid,
Austin Schuh73340842021-07-30 22:32:06 -0700644 monotonic_start_time +
645 std::chrono::nanoseconds(connection->monotonic_offset()),
646 realtime_start_time, monotonic_start_time, realtime_start_time);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800647 return true;
648 }
649 }
650 return false;
651}
652
653aos::SizePrefixedFlatbufferDetachedBuffer<LogFileHeader> Logger::MakeHeader(
Austin Schuh73340842021-07-30 22:32:06 -0700654 std::string_view config_sha256) {
Austin Schuhb06f03b2021-02-17 22:00:37 -0800655 flatbuffers::FlatBufferBuilder fbb;
656 fbb.ForceDefaults(true);
657
658 flatbuffers::Offset<aos::Configuration> configuration_offset;
659 if (!separate_config_) {
660 configuration_offset = CopyFlatBuffer(configuration_, &fbb);
661 } else {
662 CHECK(!config_sha256.empty());
663 }
664
665 const flatbuffers::Offset<flatbuffers::String> name_offset =
666 fbb.CreateString(name_);
667
Austin Schuhfa712682022-05-11 16:43:42 -0700668 const flatbuffers::Offset<flatbuffers::String> logger_sha1_offset =
669 logger_sha1_.empty() ? 0 : fbb.CreateString(logger_sha1_);
670 const flatbuffers::Offset<flatbuffers::String> logger_version_offset =
671 logger_version_.empty() ? 0 : fbb.CreateString(logger_version_);
672
Austin Schuhb06f03b2021-02-17 22:00:37 -0800673 CHECK(log_event_uuid_ != UUID::Zero());
674 const flatbuffers::Offset<flatbuffers::String> log_event_uuid_offset =
Austin Schuh5e2bfb82021-03-13 22:46:55 -0800675 log_event_uuid_.PackString(&fbb);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800676
677 const flatbuffers::Offset<flatbuffers::String> logger_instance_uuid_offset =
Austin Schuh5e2bfb82021-03-13 22:46:55 -0800678 logger_instance_uuid_.PackString(&fbb);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800679
680 flatbuffers::Offset<flatbuffers::String> log_start_uuid_offset;
Austin Schuh34f9e482021-03-31 22:54:18 -0700681 if (log_start_uuid_) {
682 log_start_uuid_offset = fbb.CreateString(log_start_uuid_->ToString());
Austin Schuhb06f03b2021-02-17 22:00:37 -0800683 }
684
685 flatbuffers::Offset<flatbuffers::String> config_sha256_offset;
686 if (!config_sha256.empty()) {
687 config_sha256_offset = fbb.CreateString(config_sha256);
688 }
689
690 const flatbuffers::Offset<flatbuffers::String> logger_node_boot_uuid_offset =
Austin Schuh5e2bfb82021-03-13 22:46:55 -0800691 event_loop_->boot_uuid().PackString(&fbb);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800692
Austin Schuhb06f03b2021-02-17 22:00:37 -0800693 flatbuffers::Offset<Node> logger_node_offset;
694
695 if (configuration::MultiNode(configuration_)) {
Austin Schuh5b728b72021-06-16 14:57:15 -0700696 logger_node_offset = RecursiveCopyFlatBuffer(node_, &fbb);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800697 }
698
699 aos::logger::LogFileHeader::Builder log_file_header_builder(fbb);
700
701 log_file_header_builder.add_name(name_offset);
Austin Schuhfa712682022-05-11 16:43:42 -0700702 if (!logger_sha1_offset.IsNull()) {
703 log_file_header_builder.add_logger_sha1(logger_sha1_offset);
704 }
705 if (!logger_version_offset.IsNull()) {
706 log_file_header_builder.add_logger_version(logger_version_offset);
707 }
Austin Schuhb06f03b2021-02-17 22:00:37 -0800708
709 // Only add the node if we are running in a multinode configuration.
Austin Schuh73340842021-07-30 22:32:06 -0700710 if (configuration::MultiNode(configuration_)) {
Austin Schuhb06f03b2021-02-17 22:00:37 -0800711 log_file_header_builder.add_logger_node(logger_node_offset);
712 }
713
714 if (!configuration_offset.IsNull()) {
715 log_file_header_builder.add_configuration(configuration_offset);
716 }
717 // The worst case theoretical out of order is the polling period times 2.
718 // One message could get logged right after the boundary, but be for right
719 // before the next boundary. And the reverse could happen for another
720 // message. Report back 3x to be extra safe, and because the cost isn't
721 // huge on the read side.
722 log_file_header_builder.add_max_out_of_order_duration(
723 std::chrono::nanoseconds(3 * polling_period_).count());
724
Austin Schuhb06f03b2021-02-17 22:00:37 -0800725 log_file_header_builder.add_log_event_uuid(log_event_uuid_offset);
726 log_file_header_builder.add_logger_instance_uuid(logger_instance_uuid_offset);
727 if (!log_start_uuid_offset.IsNull()) {
728 log_file_header_builder.add_log_start_uuid(log_start_uuid_offset);
729 }
730 log_file_header_builder.add_logger_node_boot_uuid(
731 logger_node_boot_uuid_offset);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800732
733 if (!config_sha256_offset.IsNull()) {
734 log_file_header_builder.add_configuration_sha256(config_sha256_offset);
735 }
736
737 fbb.FinishSizePrefixed(log_file_header_builder.Finish());
738 aos::SizePrefixedFlatbufferDetachedBuffer<LogFileHeader> result(
739 fbb.Release());
740
741 CHECK(result.Verify()) << ": Built a corrupted header.";
742
743 return result;
744}
745
746void Logger::ResetStatisics() {
747 max_message_fetch_time_ = std::chrono::nanoseconds::zero();
748 max_message_fetch_time_channel_ = -1;
749 max_message_fetch_time_size_ = -1;
750 total_message_fetch_time_ = std::chrono::nanoseconds::zero();
751 total_message_fetch_count_ = 0;
752 total_message_fetch_bytes_ = 0;
753 total_nop_fetch_time_ = std::chrono::nanoseconds::zero();
754 total_nop_fetch_count_ = 0;
755 max_copy_time_ = std::chrono::nanoseconds::zero();
756 max_copy_time_channel_ = -1;
757 max_copy_time_size_ = -1;
758 total_copy_time_ = std::chrono::nanoseconds::zero();
759 total_copy_count_ = 0;
760 total_copy_bytes_ = 0;
761}
762
763void Logger::Rotate() {
764 for (const Node *node : log_namer_->nodes()) {
Austin Schuh73340842021-07-30 22:32:06 -0700765 log_namer_->Rotate(node);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800766 }
767}
768
Austin Schuh48d10d62022-10-16 22:19:23 -0700769// Class to copy a context into the provided buffer.
770class ContextDataCopier : public DataEncoder::Copier {
771 public:
Naman Gupta41d70c22022-11-21 15:29:52 -0800772 ContextDataCopier(const Context &context, int channel_index, LogType log_type,
773 EventLoop *event_loop)
Austin Schuh48d10d62022-10-16 22:19:23 -0700774 : DataEncoder::Copier(PackMessageSize(log_type, context.size)),
775 context_(context),
776 channel_index_(channel_index),
777 log_type_(log_type),
778 event_loop_(event_loop) {}
779
780 monotonic_clock::time_point end_time() const { return end_time_; }
781
782 size_t Copy(uint8_t *data) final {
783 size_t result =
784 PackMessageInline(data, context_, channel_index_, log_type_);
785 end_time_ = event_loop_->monotonic_now();
786 return result;
787 }
788
789 private:
790 const Context &context_;
791 const int channel_index_;
792 const LogType log_type_;
793 EventLoop *event_loop_;
794 monotonic_clock::time_point end_time_;
795};
796
797// Class to copy a RemoteMessage into the provided buffer.
798class RemoteMessageCopier : public DataEncoder::Copier {
799 public:
Naman Gupta41d70c22022-11-21 15:29:52 -0800800 RemoteMessageCopier(const message_bridge::RemoteMessage *message,
801 int channel_index,
802 aos::monotonic_clock::time_point monotonic_timestamp_time,
803 EventLoop *event_loop)
Austin Schuh48d10d62022-10-16 22:19:23 -0700804 : DataEncoder::Copier(PackRemoteMessageSize()),
805 message_(message),
806 channel_index_(channel_index),
807 monotonic_timestamp_time_(monotonic_timestamp_time),
808 event_loop_(event_loop) {}
809
810 monotonic_clock::time_point end_time() const { return end_time_; }
811
812 size_t Copy(uint8_t *data) final {
813 size_t result = PackRemoteMessageInline(data, message_, channel_index_,
814 monotonic_timestamp_time_);
815 end_time_ = event_loop_->monotonic_now();
816 return result;
817 }
818
819 private:
820 const message_bridge::RemoteMessage *message_;
821 int channel_index_;
822 aos::monotonic_clock::time_point monotonic_timestamp_time_;
823 EventLoop *event_loop_;
824 monotonic_clock::time_point end_time_;
825};
826
Brian Smartt03c00da2022-02-24 10:25:00 -0800827void Logger::WriteData(NewDataWriter *writer, const FetcherStruct &f) {
828 if (writer != nullptr) {
829 const UUID source_node_boot_uuid =
830 static_cast<int>(node_index_) != f.data_node_index
831 ? f.fetcher->context().source_boot_uuid
832 : event_loop_->boot_uuid();
833 // Write!
834 const auto start = event_loop_->monotonic_now();
Brian Smartt03c00da2022-02-24 10:25:00 -0800835
Naman Gupta41d70c22022-11-21 15:29:52 -0800836 ContextDataCopier coppier(f.fetcher->context(), f.channel_index, f.log_type,
837 event_loop_);
Brian Smartt03c00da2022-02-24 10:25:00 -0800838
Austin Schuh48d10d62022-10-16 22:19:23 -0700839 writer->CopyMessage(&coppier, source_node_boot_uuid, start);
840 RecordCreateMessageTime(start, coppier.end_time(), f);
Brian Smartt03c00da2022-02-24 10:25:00 -0800841
Brian Smartt796cca02022-04-12 15:07:21 -0700842 VLOG(2) << "Wrote data as node " << FlatbufferToJson(node_)
843 << " for channel "
Brian Smartt03c00da2022-02-24 10:25:00 -0800844 << configuration::CleanedChannelToString(f.fetcher->channel())
Austin Schuh48d10d62022-10-16 22:19:23 -0700845 << " to " << writer->filename();
Brian Smartt03c00da2022-02-24 10:25:00 -0800846 }
847}
848
Brian Smartt796cca02022-04-12 15:07:21 -0700849void Logger::WriteTimestamps(NewDataWriter *timestamp_writer,
850 const FetcherStruct &f) {
Brian Smartt03c00da2022-02-24 10:25:00 -0800851 if (timestamp_writer != nullptr) {
852 // And now handle timestamps.
Brian Smartt03c00da2022-02-24 10:25:00 -0800853
854 // Tell our writer that we know something about the remote boot.
855 timestamp_writer->UpdateRemote(
856 f.data_node_index, f.fetcher->context().source_boot_uuid,
857 f.fetcher->context().monotonic_remote_time,
858 f.fetcher->context().monotonic_event_time, f.reliable_forwarding);
Austin Schuh48d10d62022-10-16 22:19:23 -0700859
860 const auto start = event_loop_->monotonic_now();
861 ContextDataCopier coppier(f.fetcher->context(), f.channel_index,
Naman Gupta41d70c22022-11-21 15:29:52 -0800862 LogType::kLogDeliveryTimeOnly, event_loop_);
Austin Schuh48d10d62022-10-16 22:19:23 -0700863
864 timestamp_writer->CopyMessage(&coppier, event_loop_->boot_uuid(), start);
865 RecordCreateMessageTime(start, coppier.end_time(), f);
Brian Smartt03c00da2022-02-24 10:25:00 -0800866
Brian Smartt796cca02022-04-12 15:07:21 -0700867 VLOG(2) << "Wrote timestamps as node " << FlatbufferToJson(node_)
868 << " for channel "
Brian Smartt03c00da2022-02-24 10:25:00 -0800869 << configuration::CleanedChannelToString(f.fetcher->channel())
Austin Schuh48d10d62022-10-16 22:19:23 -0700870 << " to " << timestamp_writer->filename() << " timestamp";
Brian Smartt03c00da2022-02-24 10:25:00 -0800871 }
872}
873
Brian Smartt796cca02022-04-12 15:07:21 -0700874void Logger::WriteContent(NewDataWriter *contents_writer,
875 const FetcherStruct &f) {
Brian Smartt03c00da2022-02-24 10:25:00 -0800876 if (contents_writer != nullptr) {
877 const auto start = event_loop_->monotonic_now();
878 // And now handle the special message contents channel. Copy the
879 // message into a FlatBufferBuilder and save it to disk.
Brian Smartt03c00da2022-02-24 10:25:00 -0800880 const RemoteMessage *msg =
881 flatbuffers::GetRoot<RemoteMessage>(f.fetcher->context().data);
882
883 CHECK(msg->has_boot_uuid()) << ": " << aos::FlatbufferToJson(msg);
Brian Smartt03c00da2022-02-24 10:25:00 -0800884 // Translate from the channel index that the event loop uses to the
885 // channel index in the log file.
Austin Schuhf2d0e682022-10-16 14:20:58 -0700886 const int channel_index =
887 event_loop_to_logged_channel_index_[msg->channel_index()];
Brian Smartt03c00da2022-02-24 10:25:00 -0800888
889 const aos::monotonic_clock::time_point monotonic_timestamp_time =
890 f.fetcher->context().monotonic_event_time;
Brian Smartt03c00da2022-02-24 10:25:00 -0800891
Brian Smartt03c00da2022-02-24 10:25:00 -0800892 // Timestamps tell us information about what happened too!
893 // Capture any reboots so UpdateRemote is properly recorded.
894 contents_writer->UpdateBoot(UUID::FromVector(msg->boot_uuid()));
895
896 // Start with recording info about the data flowing from our node to the
897 // remote.
898 const bool reliable =
899 f.channel_reliable_contents.size() != 0u
900 ? f.channel_reliable_contents[msg->channel_index()]
901 : f.reliable_contents;
902
Brian Smartt796cca02022-04-12 15:07:21 -0700903 contents_writer->UpdateRemote(
904 node_index_, event_loop_->boot_uuid(),
Brian Smartt03c00da2022-02-24 10:25:00 -0800905 monotonic_clock::time_point(
906 chrono::nanoseconds(msg->monotonic_remote_time())),
907 monotonic_clock::time_point(
908 chrono::nanoseconds(msg->monotonic_sent_time())),
909 reliable, monotonic_timestamp_time);
910
Austin Schuh48d10d62022-10-16 22:19:23 -0700911 RemoteMessageCopier coppier(msg, channel_index, monotonic_timestamp_time,
Naman Gupta41d70c22022-11-21 15:29:52 -0800912 event_loop_);
Austin Schuh48d10d62022-10-16 22:19:23 -0700913
914 contents_writer->CopyMessage(&coppier, UUID::FromVector(msg->boot_uuid()),
915 start);
916
917 RecordCreateMessageTime(start, coppier.end_time(), f);
Brian Smartt03c00da2022-02-24 10:25:00 -0800918 }
919}
920
921void Logger::WriteFetchedRecord(FetcherStruct &f) {
922 WriteData(f.writer, f);
923 WriteTimestamps(f.timestamp_writer, f);
924 WriteContent(f.contents_writer, f);
925}
926
927bool Logger::LogUntil(monotonic_clock::time_point t) {
928 bool has_pending_messages = false;
929
Austin Schuhb06f03b2021-02-17 22:00:37 -0800930 // Grab the latest ServerStatistics message. This will always have the
931 // oppertunity to be >= to the current time, so it will always represent any
932 // reboots which may have happened.
933 WriteMissingTimestamps();
934
935 // Write each channel to disk, one at a time.
936 for (FetcherStruct &f : fetchers_) {
937 while (true) {
938 if (f.written) {
939 const auto start = event_loop_->monotonic_now();
940 const bool got_new = f.fetcher->FetchNext();
941 const auto end = event_loop_->monotonic_now();
942 RecordFetchResult(start, end, got_new, &f);
943 if (!got_new) {
944 VLOG(2) << "No new data on "
945 << configuration::CleanedChannelToString(
946 f.fetcher->channel());
947 break;
948 }
949 f.written = false;
950 }
951
952 // TODO(james): Write tests to exercise this logic.
953 if (f.fetcher->context().monotonic_event_time >= t) {
Brian Smartt03c00da2022-02-24 10:25:00 -0800954 has_pending_messages = true;
Austin Schuhb06f03b2021-02-17 22:00:37 -0800955 break;
956 }
Austin Schuhb06f03b2021-02-17 22:00:37 -0800957
Brian Smartt03c00da2022-02-24 10:25:00 -0800958 WriteFetchedRecord(f);
Austin Schuhb06f03b2021-02-17 22:00:37 -0800959
960 f.written = true;
961 }
962 }
963 last_synchronized_time_ = t;
Brian Smartt03c00da2022-02-24 10:25:00 -0800964
965 return has_pending_messages;
Austin Schuhb06f03b2021-02-17 22:00:37 -0800966}
967
Austin Schuh30586902021-03-30 22:54:08 -0700968void Logger::DoLogData(const monotonic_clock::time_point end_time,
969 bool run_on_logged) {
Austin Schuhb06f03b2021-02-17 22:00:37 -0800970 // We want to guarantee that messages aren't out of order by more than
971 // max_out_of_order_duration. To do this, we need sync points. Every write
972 // cycle should be a sync point.
973
974 do {
975 // Move the sync point up by at most polling_period. This forces one sync
976 // per iteration, even if it is small.
977 LogUntil(std::min(last_synchronized_time_ + polling_period_, end_time));
978
Austin Schuh30586902021-03-30 22:54:08 -0700979 if (run_on_logged) {
980 on_logged_period_();
981 }
Austin Schuhb06f03b2021-02-17 22:00:37 -0800982
983 // If we missed cycles, we could be pretty far behind. Spin until we are
984 // caught up.
985 } while (last_synchronized_time_ + polling_period_ < end_time);
986}
987
988void Logger::RecordFetchResult(aos::monotonic_clock::time_point start,
989 aos::monotonic_clock::time_point end,
990 bool got_new, FetcherStruct *fetcher) {
991 const auto duration = end - start;
992 if (!got_new) {
993 ++total_nop_fetch_count_;
994 total_nop_fetch_time_ += duration;
995 return;
996 }
997 ++total_message_fetch_count_;
998 total_message_fetch_bytes_ += fetcher->fetcher->context().size;
999 total_message_fetch_time_ += duration;
1000 if (duration > max_message_fetch_time_) {
1001 max_message_fetch_time_ = duration;
1002 max_message_fetch_time_channel_ = fetcher->channel_index;
1003 max_message_fetch_time_size_ = fetcher->fetcher->context().size;
1004 }
1005}
1006
1007void Logger::RecordCreateMessageTime(aos::monotonic_clock::time_point start,
1008 aos::monotonic_clock::time_point end,
Brian Smartt03c00da2022-02-24 10:25:00 -08001009 const FetcherStruct &fetcher) {
Austin Schuhb06f03b2021-02-17 22:00:37 -08001010 const auto duration = end - start;
1011 total_copy_time_ += duration;
1012 ++total_copy_count_;
Brian Smartt03c00da2022-02-24 10:25:00 -08001013 total_copy_bytes_ += fetcher.fetcher->context().size;
Austin Schuhb06f03b2021-02-17 22:00:37 -08001014 if (duration > max_copy_time_) {
1015 max_copy_time_ = duration;
Brian Smartt03c00da2022-02-24 10:25:00 -08001016 max_copy_time_channel_ = fetcher.channel_index;
1017 max_copy_time_size_ = fetcher.fetcher->context().size;
Austin Schuhb06f03b2021-02-17 22:00:37 -08001018 }
1019}
1020
1021} // namespace logger
1022} // namespace aos