blob: 8293956cf266154754682677861b9900008324fb [file] [log] [blame]
Austin Schuhb06f03b2021-02-17 22:00:37 -08001#ifndef AOS_EVENTS_LOGGING_LOG_READER_H_
2#define AOS_EVENTS_LOGGING_LOG_READER_H_
Austin Schuhe309d2a2019-11-29 13:25:21 -08003
Austin Schuh8bd96322020-02-13 21:18:22 -08004#include <chrono>
Austin Schuhe309d2a2019-11-29 13:25:21 -08005#include <deque>
Austin Schuh05b70472020-01-01 17:11:17 -08006#include <string_view>
Austin Schuh2f8fd752020-09-01 22:38:28 -07007#include <tuple>
Austin Schuh6f3babe2020-01-26 20:34:50 -08008#include <vector>
Austin Schuhe309d2a2019-11-29 13:25:21 -08009
Austin Schuhe309d2a2019-11-29 13:25:21 -080010#include "aos/events/event_loop.h"
Austin Schuhf6f9bf32020-10-11 14:37:43 -070011#include "aos/events/logging/logfile_sorting.h"
Austin Schuha36c8902019-12-30 18:07:15 -080012#include "aos/events/logging/logfile_utils.h"
James Kuszmaul38735e82019-12-07 16:42:06 -080013#include "aos/events/logging/logger_generated.h"
Austin Schuh92547522019-12-28 14:33:43 -080014#include "aos/events/simulated_event_loop.h"
Austin Schuh2f8fd752020-09-01 22:38:28 -070015#include "aos/network/message_bridge_server_generated.h"
Austin Schuh0ca1fd32020-12-18 22:53:05 -080016#include "aos/network/multinode_timestamp_filter.h"
Austin Schuh0de30f32020-12-06 12:44:28 -080017#include "aos/network/remote_message_generated.h"
Austin Schuh8bd96322020-02-13 21:18:22 -080018#include "aos/network/timestamp_filter.h"
Austin Schuhe309d2a2019-11-29 13:25:21 -080019#include "aos/time/time.h"
Austin Schuh4385b142021-03-14 21:31:13 -070020#include "aos/uuid.h"
Austin Schuhe309d2a2019-11-29 13:25:21 -080021#include "flatbuffers/flatbuffers.h"
22
23namespace aos {
24namespace logger {
25
// We end up with one of the following 3 log file types.
//
// Single node logged as the source node.
//   -> Replayed just on the source node.
//
// Forwarding timestamps only logged from the perspective of the destination
// node.
//   -> Matched with data on source node and logged.
//
// Forwarding timestamps with data logged as the destination node.
//   -> Replayed just as the destination
//   -> Replayed as the source (Much harder, ordering is not defined)
//
// Duplicate data logged. -> CHECK that it matches and explode otherwise.
//
// This can be boiled down to a set of constraints and tools.
//
// Constraints:
// 1) Forwarding timestamps and data need to be logged separately.
// 2) Any forwarded data logged on the destination node needs to be logged
//    separately such that it can be sorted.
//
// Tools:
// 1) Log reader needs to be able to sort a list of log files.
// 2) Log reader needs to be able to merge sorted lists of log files.
// 3) Log reader needs to be able to match timestamps with messages.
//
// We also need to be able to generate multiple views of a log file depending on
// the target.
53
Austin Schuhe309d2a2019-11-29 13:25:21 -080054// Replays all the channels in the logfile to the event loop.
55class LogReader {
56 public:
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -080057 // If you want to supply a new configuration that will be used for replay
58 // (e.g., to change message rates, or to populate an updated schema), then
59 // pass it in here. It must provide all the channels that the original logged
60 // config did.
Austin Schuh6f3babe2020-01-26 20:34:50 -080061 //
Austin Schuh287d43d2020-12-04 20:19:33 -080062 // The single file constructor calls SortParts internally.
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -080063 LogReader(std::string_view filename,
64 const Configuration *replay_configuration = nullptr);
Austin Schuh287d43d2020-12-04 20:19:33 -080065 LogReader(std::vector<LogFile> log_files,
Austin Schuh11d43732020-09-21 17:28:30 -070066 const Configuration *replay_configuration = nullptr);
James Kuszmaul7daef362019-12-31 18:28:17 -080067 ~LogReader();
Austin Schuhe309d2a2019-11-29 13:25:21 -080068
Austin Schuh6331ef92020-01-07 18:28:09 -080069 // Registers all the callbacks to send the log file data out on an event loop
70 // created in event_loop_factory. This also updates time to be at the start
71 // of the log file by running until the log file starts.
72 // Note: the configuration used in the factory should be configuration()
73 // below, but can be anything as long as the locations needed to send
74 // everything are available.
James Kuszmaul84ff3e52020-01-03 19:48:53 -080075 void Register(SimulatedEventLoopFactory *event_loop_factory);
Austin Schuh58646e22021-08-23 23:51:46 -070076 // Registers all the callbacks to send the log file data out to an event loop
77 // factory. This does not start replaying or change the current distributed
78 // time of the factory. It does change the monotonic clocks to be right.
79 void RegisterWithoutStarting(SimulatedEventLoopFactory *event_loop_factory);
Austin Schuh6331ef92020-01-07 18:28:09 -080080 // Creates an SimulatedEventLoopFactory accessible via event_loop_factory(),
81 // and then calls Register.
82 void Register();
83 // Registers callbacks for all the events after the log file starts. This is
84 // only useful when replaying live.
Austin Schuhe309d2a2019-11-29 13:25:21 -080085 void Register(EventLoop *event_loop);
Austin Schuh6331ef92020-01-07 18:28:09 -080086
Austin Schuh58646e22021-08-23 23:51:46 -070087 // Called whenever a log file starts for a node.
88 void OnStart(std::function<void()> fn);
89 void OnStart(const Node *node, std::function<void()> fn);
90 // Called whenever a log file ends for a node.
91 void OnEnd(std::function<void()> fn);
92 void OnEnd(const Node *node, std::function<void()> fn);
93
James Kuszmaul84ff3e52020-01-03 19:48:53 -080094 // Unregisters the senders. You only need to call this if you separately
95 // supplied an event loop or event loop factory and the lifetimes are such
96 // that they need to be explicitly destroyed before the LogReader destructor
97 // gets called.
Austin Schuhe309d2a2019-11-29 13:25:21 -080098 void Deregister();
99
Austin Schuh0c297012020-09-16 18:41:59 -0700100 // Returns the configuration being used for replay from the log file.
101 // Note that this may be different from the configuration actually used for
102 // handling events. You should generally only use this to create a
103 // SimulatedEventLoopFactory, and then get the configuration from there for
104 // everything else.
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800105 const Configuration *logged_configuration() const;
Austin Schuh11d43732020-09-21 17:28:30 -0700106 // Returns the configuration being used for replay from the log file.
107 // Note that this may be different from the configuration actually used for
108 // handling events. You should generally only use this to create a
109 // SimulatedEventLoopFactory, and then get the configuration from there for
110 // everything else.
Austin Schuh6f3babe2020-01-26 20:34:50 -0800111 // The pointer is invalidated whenever RemapLoggedChannel is called.
Austin Schuh15649d62019-12-28 16:36:38 -0800112 const Configuration *configuration() const;
113
Austin Schuh6f3babe2020-01-26 20:34:50 -0800114 // Returns the nodes that this log file was created on. This is a list of
Austin Schuh07676622021-01-21 18:59:17 -0800115 // pointers to a node in the nodes() list inside logged_configuration().
116 std::vector<const Node *> LoggedNodes() const;
Austin Schuhe309d2a2019-11-29 13:25:21 -0800117
118 // Returns the starting timestamp for the log file.
Austin Schuh11d43732020-09-21 17:28:30 -0700119 monotonic_clock::time_point monotonic_start_time(
120 const Node *node = nullptr) const;
121 realtime_clock::time_point realtime_start_time(
122 const Node *node = nullptr) const;
Austin Schuhe309d2a2019-11-29 13:25:21 -0800123
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800124 // Causes the logger to publish the provided channel on a different name so
125 // that replayed applications can publish on the proper channel name without
126 // interference. This operates on raw channel names, without any node or
127 // application specific mappings.
128 void RemapLoggedChannel(std::string_view name, std::string_view type,
Austin Schuh0de30f32020-12-06 12:44:28 -0800129 std::string_view add_prefix = "/original",
130 std::string_view new_type = "");
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800131 template <typename T>
132 void RemapLoggedChannel(std::string_view name,
Austin Schuh0de30f32020-12-06 12:44:28 -0800133 std::string_view add_prefix = "/original",
134 std::string_view new_type = "") {
135 RemapLoggedChannel(name, T::GetFullyQualifiedName(), add_prefix, new_type);
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800136 }
137
Austin Schuh01b4c352020-09-21 23:09:39 -0700138 // Remaps the provided channel, though this respects node mappings, and
139 // preserves them too. This makes it so if /aos -> /pi1/aos on one node,
140 // /original/aos -> /original/pi1/aos on the same node after renaming, just
Austin Schuh0de30f32020-12-06 12:44:28 -0800141 // like you would hope. If new_type is not empty, the new channel will use
142 // the provided type instead. This allows for renaming messages.
Austin Schuh01b4c352020-09-21 23:09:39 -0700143 //
144 // TODO(austin): If you have 2 nodes remapping something to the same channel,
145 // this doesn't handle that. No use cases exist yet for that, so it isn't
146 // being done yet.
147 void RemapLoggedChannel(std::string_view name, std::string_view type,
148 const Node *node,
Austin Schuh0de30f32020-12-06 12:44:28 -0800149 std::string_view add_prefix = "/original",
150 std::string_view new_type = "");
Brian Silvermande9f3ff2020-04-28 16:56:58 -0700151 template <typename T>
Austin Schuh01b4c352020-09-21 23:09:39 -0700152 void RemapLoggedChannel(std::string_view name, const Node *node,
Austin Schuh0de30f32020-12-06 12:44:28 -0800153 std::string_view add_prefix = "/original",
154 std::string_view new_type = "") {
155 RemapLoggedChannel(name, T::GetFullyQualifiedName(), node, add_prefix,
156 new_type);
Austin Schuh01b4c352020-09-21 23:09:39 -0700157 }
158
159 template <typename T>
160 bool HasChannel(std::string_view name, const Node *node = nullptr) {
Austin Schuh0ca51f32020-12-25 21:51:45 -0800161 return configuration::GetChannel(logged_configuration(), name,
Austin Schuh0de30f32020-12-06 12:44:28 -0800162 T::GetFullyQualifiedName(), "", node,
163 true) != nullptr;
Brian Silvermande9f3ff2020-04-28 16:56:58 -0700164 }
165
James Kuszmaul4f106fb2021-01-05 20:53:02 -0800166 // Returns true if the channel exists on the node and was logged.
167 template <typename T>
168 bool HasLoggedChannel(std::string_view name, const Node *node = nullptr) {
Austin Schuh5ee56872021-01-30 16:53:34 -0800169 const Channel *channel =
170 configuration::GetChannel(logged_configuration(), name,
171 T::GetFullyQualifiedName(), "", node, true);
James Kuszmaul4f106fb2021-01-05 20:53:02 -0800172 if (channel == nullptr) return false;
173 return channel->logger() != LoggerConfig::NOT_LOGGED;
174 }
175
James Kuszmaul84ff3e52020-01-03 19:48:53 -0800176 SimulatedEventLoopFactory *event_loop_factory() {
177 return event_loop_factory_;
178 }
179
Austin Schuh0ca51f32020-12-25 21:51:45 -0800180 std::string_view name() const { return log_files_[0].name; }
Austin Schuh0c297012020-09-16 18:41:59 -0700181
James Kuszmaul71a81932020-12-15 21:08:01 -0800182 // Set whether to exit the SimulatedEventLoopFactory when we finish reading
183 // the logfile.
184 void set_exit_on_finish(bool exit_on_finish) {
185 exit_on_finish_ = exit_on_finish;
186 }
187
Austin Schuhe309d2a2019-11-29 13:25:21 -0800188 private:
Austin Schuh58646e22021-08-23 23:51:46 -0700189 void Register(EventLoop *event_loop, const Node *node);
190
191 void RegisterDuringStartup(EventLoop *event_loop, const Node *node);
192
193 const Channel *RemapChannel(const EventLoop *event_loop, const Node *node,
Austin Schuh6f3babe2020-01-26 20:34:50 -0800194 const Channel *channel);
195
Austin Schuhe309d2a2019-11-29 13:25:21 -0800196 // Queues at least max_out_of_order_duration_ messages into channels_.
197 void QueueMessages();
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800198 // Handle constructing a configuration with all the additional remapped
199 // channels from calls to RemapLoggedChannel.
200 void MakeRemappedConfig();
Austin Schuhe309d2a2019-11-29 13:25:21 -0800201
Austin Schuh2f8fd752020-09-01 22:38:28 -0700202 // Returns the number of nodes.
203 size_t nodes_count() const {
204 return !configuration::MultiNode(logged_configuration())
205 ? 1u
206 : logged_configuration()->nodes()->size();
207 }
208
Austin Schuh287d43d2020-12-04 20:19:33 -0800209 const std::vector<LogFile> log_files_;
Austin Schuh6f3babe2020-01-26 20:34:50 -0800210
Austin Schuh969cd602021-01-03 00:09:45 -0800211 // Class to manage sending RemoteMessages on the provided node after the
212 // correct delay.
Austin Schuh5ee56872021-01-30 16:53:34 -0800213 class RemoteMessageSender {
Austin Schuh969cd602021-01-03 00:09:45 -0800214 public:
215 RemoteMessageSender(aos::Sender<message_bridge::RemoteMessage> sender,
216 EventLoop *event_loop);
217 RemoteMessageSender(RemoteMessageSender const &) = delete;
218 RemoteMessageSender &operator=(RemoteMessageSender const &) = delete;
219
220 // Sends the provided message. If monotonic_timestamp_time is min_time,
221 // send it immediately.
222 void Send(
223 FlatbufferDetachedBuffer<message_bridge::RemoteMessage> remote_message,
Austin Schuh58646e22021-08-23 23:51:46 -0700224 BootTimestamp monotonic_timestamp_time, size_t source_boot_count);
Austin Schuh969cd602021-01-03 00:09:45 -0800225
226 private:
227 // Handles actually sending the timestamp if we were delayed.
228 void SendTimestamp();
229 // Handles scheduling the timer to send at the correct time.
230 void ScheduleTimestamp();
231
232 EventLoop *event_loop_;
233 aos::Sender<message_bridge::RemoteMessage> sender_;
234 aos::TimerHandler *timer_;
235
236 // Time we are scheduled for, or min_time if we aren't scheduled.
237 monotonic_clock::time_point scheduled_time_ = monotonic_clock::min_time;
238
239 struct Timestamp {
240 Timestamp(FlatbufferDetachedBuffer<message_bridge::RemoteMessage>
241 new_remote_message,
242 monotonic_clock::time_point new_monotonic_timestamp_time)
243 : remote_message(std::move(new_remote_message)),
244 monotonic_timestamp_time(new_monotonic_timestamp_time) {}
245 FlatbufferDetachedBuffer<message_bridge::RemoteMessage> remote_message;
246 monotonic_clock::time_point monotonic_timestamp_time;
247 };
248
249 // List of messages to send. The timer works through them and then disables
250 // itself automatically.
251 std::deque<Timestamp> remote_timestamps_;
252 };
253
Austin Schuh6f3babe2020-01-26 20:34:50 -0800254 // State per node.
Austin Schuh858c9f32020-08-31 16:56:12 -0700255 class State {
256 public:
Austin Schuh58646e22021-08-23 23:51:46 -0700257 State(std::unique_ptr<TimestampMapper> timestamp_mapper, const Node *node);
Austin Schuh287d43d2020-12-04 20:19:33 -0800258
259 // Connects up the timestamp mappers.
260 void AddPeer(State *peer);
Austin Schuh6f3babe2020-01-26 20:34:50 -0800261
Austin Schuhe639ea12021-01-25 13:00:22 -0800262 TimestampMapper *timestamp_mapper() { return timestamp_mapper_.get(); }
263
Austin Schuhdda74ec2021-01-03 19:30:37 -0800264 // Returns the next sorted message with all the timestamps extracted and
265 // matched.
266 TimestampedMessage PopOldest();
Austin Schuh188eabe2020-12-29 23:41:13 -0800267
Austin Schuh858c9f32020-08-31 16:56:12 -0700268 // Returns the monotonic time of the oldest message.
Austin Schuh58646e22021-08-23 23:51:46 -0700269 BootTimestamp OldestMessageTime() const;
270
271 size_t boot_count() const {
272 // If we are replaying directly into an event loop, we can't reboot. So
273 // we will stay stuck on the 0th boot.
274 if (!node_event_loop_factory_) return 0u;
275 return node_event_loop_factory_->boot_count();
276 }
Austin Schuh858c9f32020-08-31 16:56:12 -0700277
278 // Primes the queues inside State. Should be called before calling
279 // OldestMessageTime.
280 void SeedSortedMessages();
Austin Schuh8bd96322020-02-13 21:18:22 -0800281
Austin Schuh58646e22021-08-23 23:51:46 -0700282 void SetupStartupTimer() {
283 const monotonic_clock::time_point start_time =
284 monotonic_start_time(boot_count());
285 if (start_time == monotonic_clock::min_time) {
286 LOG(ERROR)
287 << "No start time, skipping, please figure out when this happens";
288 RunOnStart();
289 return;
290 }
291 CHECK_GT(start_time, event_loop_->monotonic_now());
292 startup_timer_->Setup(start_time);
293 }
294
295 void set_startup_timer(TimerHandler *timer_handler) {
296 startup_timer_ = timer_handler;
297 if (startup_timer_) {
298 if (event_loop_->node() != nullptr) {
299 startup_timer_->set_name(absl::StrCat(
300 event_loop_->node()->name()->string_view(), "_startup"));
301 } else {
302 startup_timer_->set_name("startup");
303 }
304 }
305 }
306
Austin Schuh858c9f32020-08-31 16:56:12 -0700307 // Returns the starting time for this node.
Austin Schuh2dc8c7d2021-07-01 17:41:28 -0700308 monotonic_clock::time_point monotonic_start_time(size_t boot_count) const {
309 return timestamp_mapper_
310 ? timestamp_mapper_->monotonic_start_time(boot_count)
311 : monotonic_clock::min_time;
Austin Schuh858c9f32020-08-31 16:56:12 -0700312 }
Austin Schuh2dc8c7d2021-07-01 17:41:28 -0700313 realtime_clock::time_point realtime_start_time(size_t boot_count) const {
314 return timestamp_mapper_
315 ? timestamp_mapper_->realtime_start_time(boot_count)
316 : realtime_clock::min_time;
Austin Schuh858c9f32020-08-31 16:56:12 -0700317 }
318
319 // Sets the node event loop factory for replaying into a
320 // SimulatedEventLoopFactory. Returns the EventLoop to use.
Austin Schuh58646e22021-08-23 23:51:46 -0700321 void SetNodeEventLoopFactory(NodeEventLoopFactory *node_event_loop_factory);
Austin Schuh858c9f32020-08-31 16:56:12 -0700322
323 // Sets and gets the event loop to use.
324 void set_event_loop(EventLoop *event_loop) { event_loop_ = event_loop; }
325 EventLoop *event_loop() { return event_loop_; }
326
Austin Schuh58646e22021-08-23 23:51:46 -0700327 const Node *node() const { return node_; }
328
329 void Register(EventLoop *event_loop);
330
331 void OnStart(std::function<void()> fn);
332 void OnEnd(std::function<void()> fn);
333
Austin Schuh858c9f32020-08-31 16:56:12 -0700334 // Sets the current realtime offset from the monotonic clock for this node
335 // (if we are on a simulated event loop).
336 void SetRealtimeOffset(monotonic_clock::time_point monotonic_time,
337 realtime_clock::time_point realtime_time) {
338 if (node_event_loop_factory_ != nullptr) {
339 node_event_loop_factory_->SetRealtimeOffset(monotonic_time,
340 realtime_time);
341 }
342 }
343
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700344 // Returns the MessageHeader sender to log delivery timestamps to for the
345 // provided remote node.
Austin Schuh61e973f2021-02-21 21:43:56 -0800346 RemoteMessageSender *RemoteTimestampSender(const Channel *channel,
347 const Connection *connection);
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700348
Austin Schuh858c9f32020-08-31 16:56:12 -0700349 // Converts a timestamp from the monotonic clock on this node to the
350 // distributed clock.
351 distributed_clock::time_point ToDistributedClock(
352 monotonic_clock::time_point time) {
353 return node_event_loop_factory_->ToDistributedClock(time);
354 }
355
Austin Schuh858c9f32020-08-31 16:56:12 -0700356 // Returns the current time on the remote node which sends messages on
357 // channel_index.
Austin Schuh58646e22021-08-23 23:51:46 -0700358 BootTimestamp monotonic_remote_now(size_t channel_index) {
359 State *s = channel_source_state_[channel_index];
360 return BootTimestamp{
361 .boot = s->boot_count(),
362 .time = s->node_event_loop_factory_->monotonic_now()};
Austin Schuh858c9f32020-08-31 16:56:12 -0700363 }
364
Austin Schuh5ee56872021-01-30 16:53:34 -0800365 // Returns the start time of the remote for the provided channel.
366 monotonic_clock::time_point monotonic_remote_start_time(
Austin Schuh58646e22021-08-23 23:51:46 -0700367 size_t boot_count, size_t channel_index) {
Austin Schuh2dc8c7d2021-07-01 17:41:28 -0700368 return channel_source_state_[channel_index]->monotonic_start_time(
369 boot_count);
Austin Schuh5ee56872021-01-30 16:53:34 -0800370 }
371
Austin Schuh58646e22021-08-23 23:51:46 -0700372 void DestroyEventLoop() { event_loop_unique_ptr_.reset(); }
373
374 EventLoop *MakeEventLoop() {
375 CHECK(!event_loop_unique_ptr_);
376 event_loop_unique_ptr_ =
377 node_event_loop_factory_->MakeEventLoop("log_reader");
378 return event_loop_unique_ptr_.get();
379 }
380
Austin Schuh2f8fd752020-09-01 22:38:28 -0700381 distributed_clock::time_point RemoteToDistributedClock(
382 size_t channel_index, monotonic_clock::time_point time) {
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700383 return channel_source_state_[channel_index]
384 ->node_event_loop_factory_->ToDistributedClock(time);
Austin Schuh2f8fd752020-09-01 22:38:28 -0700385 }
386
387 const Node *remote_node(size_t channel_index) {
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700388 return channel_source_state_[channel_index]
389 ->node_event_loop_factory_->node();
Austin Schuh2f8fd752020-09-01 22:38:28 -0700390 }
391
392 monotonic_clock::time_point monotonic_now() {
393 return node_event_loop_factory_->monotonic_now();
394 }
395
Austin Schuh858c9f32020-08-31 16:56:12 -0700396 // Sets the number of channels.
397 void SetChannelCount(size_t count);
398
399 // Sets the sender, filter, and target factory for a channel.
Austin Schuh969cd602021-01-03 00:09:45 -0800400 void SetChannel(size_t logged_channel_index, size_t factory_channel_index,
401 std::unique_ptr<RawSender> sender,
402 message_bridge::NoncausalOffsetEstimator *filter,
Austin Schuh58646e22021-08-23 23:51:46 -0700403 bool is_forwarded, State *source_state);
404
405 void SetRemoteTimestampSender(size_t logged_channel_index,
406 RemoteMessageSender *remote_timestamp_sender);
407
408 void RunOnStart();
409 void RunOnEnd();
Austin Schuh858c9f32020-08-31 16:56:12 -0700410
Austin Schuh858c9f32020-08-31 16:56:12 -0700411 // Unregisters everything so we can destory the event loop.
Austin Schuh58646e22021-08-23 23:51:46 -0700412 // TODO(austin): Is this needed? OnShutdown should be able to serve this
413 // need.
Austin Schuh858c9f32020-08-31 16:56:12 -0700414 void Deregister();
415
416 // Sets the current TimerHandle for the replay callback.
417 void set_timer_handler(TimerHandler *timer_handler) {
418 timer_handler_ = timer_handler;
Austin Schuh58646e22021-08-23 23:51:46 -0700419 if (timer_handler_) {
420 if (event_loop_->node() != nullptr) {
421 timer_handler_->set_name(absl::StrCat(
422 event_loop_->node()->name()->string_view(), "_main"));
423 } else {
424 timer_handler_->set_name("main");
425 }
426 }
Austin Schuh858c9f32020-08-31 16:56:12 -0700427 }
428
429 // Sets the next wakeup time on the replay callback.
430 void Setup(monotonic_clock::time_point next_time) {
431 timer_handler_->Setup(next_time);
432 }
433
434 // Sends a buffer on the provided channel index.
Austin Schuh287d43d2020-12-04 20:19:33 -0800435 bool Send(const TimestampedMessage &timestamped_message);
Austin Schuh858c9f32020-08-31 16:56:12 -0700436
437 // Returns a debug string for the channel merger.
Austin Schuh2f8fd752020-09-01 22:38:28 -0700438 std::string DebugString() const {
Austin Schuh287d43d2020-12-04 20:19:33 -0800439 if (!timestamp_mapper_) {
Austin Schuhe639ea12021-01-25 13:00:22 -0800440 return "";
Austin Schuh287d43d2020-12-04 20:19:33 -0800441 }
Austin Schuhe639ea12021-01-25 13:00:22 -0800442 return timestamp_mapper_->DebugString();
Austin Schuh2f8fd752020-09-01 22:38:28 -0700443 }
Austin Schuh858c9f32020-08-31 16:56:12 -0700444
Austin Schuh58646e22021-08-23 23:51:46 -0700445 void ClearRemoteTimestampSenders() {
446 channel_timestamp_loggers_.clear();
447 timestamp_loggers_.clear();
448 }
449
Austin Schuh858c9f32020-08-31 16:56:12 -0700450 private:
451 // Log file.
Austin Schuh287d43d2020-12-04 20:19:33 -0800452 std::unique_ptr<TimestampMapper> timestamp_mapper_;
Austin Schuh858c9f32020-08-31 16:56:12 -0700453
Austin Schuh858c9f32020-08-31 16:56:12 -0700454 // Senders.
455 std::vector<std::unique_ptr<RawSender>> channels_;
Austin Schuh969cd602021-01-03 00:09:45 -0800456 std::vector<RemoteMessageSender *> remote_timestamp_senders_;
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700457 // The mapping from logged channel index to sent channel index. Needed for
458 // sending out MessageHeaders.
459 std::vector<int> factory_channel_index_;
460
Austin Schuh9942bae2021-01-07 22:06:44 -0800461 struct ContiguousSentTimestamp {
462 // Most timestamps make it through the network, so it saves a ton of
463 // memory and CPU to store the start and end, and search for valid ranges.
464 // For one of the logs I looked at, we had 2 ranges for 4 days.
465 //
466 // Save monotonic times as well to help if a queue index ever wraps. Odds
467 // are very low, but doesn't hurt.
468 //
469 // The starting time and matching queue index.
470 monotonic_clock::time_point starting_monotonic_event_time =
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700471 monotonic_clock::min_time;
Austin Schuh9942bae2021-01-07 22:06:44 -0800472 uint32_t starting_queue_index = 0xffffffff;
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700473
Austin Schuh9942bae2021-01-07 22:06:44 -0800474 // Ending time and queue index.
475 monotonic_clock::time_point ending_monotonic_event_time =
476 monotonic_clock::max_time;
477 uint32_t ending_queue_index = 0xffffffff;
478
479 // The queue index that the first message was *actually* sent with. The
480 // queue indices are assumed to be contiguous through this range.
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700481 uint32_t actual_queue_index = 0xffffffff;
482 };
483
484 // Stores all the timestamps that have been sent on this channel. This is
485 // only done for channels which are forwarded and on the node which
Austin Schuh9942bae2021-01-07 22:06:44 -0800486 // initially sends the message. Compress using ranges and offsets.
487 std::vector<std::unique_ptr<std::vector<ContiguousSentTimestamp>>>
488 queue_index_map_;
Austin Schuh858c9f32020-08-31 16:56:12 -0700489
490 // Factory (if we are in sim) that this loop was created on.
491 NodeEventLoopFactory *node_event_loop_factory_ = nullptr;
492 std::unique_ptr<EventLoop> event_loop_unique_ptr_;
493 // Event loop.
Austin Schuh58646e22021-08-23 23:51:46 -0700494 const Node *node_ = nullptr;
Austin Schuh858c9f32020-08-31 16:56:12 -0700495 EventLoop *event_loop_ = nullptr;
496 // And timer used to send messages.
Austin Schuh58646e22021-08-23 23:51:46 -0700497 TimerHandler *timer_handler_ = nullptr;
498 TimerHandler *startup_timer_ = nullptr;
Austin Schuh858c9f32020-08-31 16:56:12 -0700499
Austin Schuh8bd96322020-02-13 21:18:22 -0800500 // Filters (or nullptr if it isn't a forwarded channel) for each channel.
501 // This corresponds to the object which is shared among all the channels
502 // going between 2 nodes. The second element in the tuple indicates if this
503 // is the primary direction or not.
Austin Schuh2f8fd752020-09-01 22:38:28 -0700504 std::vector<message_bridge::NoncausalOffsetEstimator *> filters_;
Austin Schuh8bd96322020-02-13 21:18:22 -0800505
506 // List of NodeEventLoopFactorys (or nullptr if it isn't a forwarded
507 // channel) which correspond to the originating node.
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700508 std::vector<State *> channel_source_state_;
509
Austin Schuh61e973f2021-02-21 21:43:56 -0800510 // This is a cache for channel, connection mapping to the corresponding
511 // sender.
512 absl::btree_map<std::pair<const Channel *, const Connection *>,
513 std::shared_ptr<RemoteMessageSender>>
514 channel_timestamp_loggers_;
515
516 // Mapping from resolved RemoteMessage channel to RemoteMessage sender. This
517 // is the channel that timestamps are published to.
518 absl::btree_map<const Channel *, std::shared_ptr<RemoteMessageSender>>
519 timestamp_loggers_;
Austin Schuh58646e22021-08-23 23:51:46 -0700520
521 std::vector<std::function<void()>> on_starts_;
522 std::vector<std::function<void()>> on_ends_;
523
524 bool stopped_ = false;
525 bool started_ = false;
Austin Schuh6f3babe2020-01-26 20:34:50 -0800526 };
527
Austin Schuh8bd96322020-02-13 21:18:22 -0800528 // Node index -> State.
529 std::vector<std::unique_ptr<State>> states_;
530
531 // Creates the requested filter if it doesn't exist, regardless of whether
532 // these nodes can actually communicate directly. The second return value
533 // reports if this is the primary direction or not.
Austin Schuh2f8fd752020-09-01 22:38:28 -0700534 message_bridge::NoncausalOffsetEstimator *GetFilter(const Node *node_a,
535 const Node *node_b);
Austin Schuh8bd96322020-02-13 21:18:22 -0800536
Austin Schuh8bd96322020-02-13 21:18:22 -0800537 // List of filters for a connection. The pointer to the first node will be
538 // less than the second node.
Austin Schuh0ca1fd32020-12-18 22:53:05 -0800539 std::unique_ptr<message_bridge::MultiNodeNoncausalOffsetEstimator> filters_;
Austin Schuh8bd96322020-02-13 21:18:22 -0800540
James Kuszmaul84ff3e52020-01-03 19:48:53 -0800541 std::unique_ptr<FlatbufferDetachedBuffer<Configuration>>
542 remapped_configuration_buffer_;
543
James Kuszmaul84ff3e52020-01-03 19:48:53 -0800544 std::unique_ptr<SimulatedEventLoopFactory> event_loop_factory_unique_ptr_;
545 SimulatedEventLoopFactory *event_loop_factory_ = nullptr;
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800546
547 // Map of channel indices to new name. The channel index will be an index into
548 // logged_configuration(), and the string key will be the name of the channel
549 // to send on instead of the logged channel name.
Austin Schuh0de30f32020-12-06 12:44:28 -0800550 struct RemappedChannel {
551 std::string remapped_name;
552 std::string new_type;
553 };
554 std::map<size_t, RemappedChannel> remapped_channels_;
Austin Schuh01b4c352020-09-21 23:09:39 -0700555 std::vector<MapT> maps_;
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800556
Austin Schuh6f3babe2020-01-26 20:34:50 -0800557 // Number of nodes which still have data to send. This is used to figure out
558 // when to exit.
559 size_t live_nodes_ = 0;
560
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800561 const Configuration *remapped_configuration_ = nullptr;
562 const Configuration *replay_configuration_ = nullptr;
Austin Schuhcde938c2020-02-02 17:30:07 -0800563
564 // If true, the replay timer will ignore any missing data. This is used
565 // during startup when we are bootstrapping everything and trying to get to
566 // the start of all the log files.
567 bool ignore_missing_data_ = false;
James Kuszmaul71a81932020-12-15 21:08:01 -0800568
569 // Whether to exit the SimulatedEventLoop when we finish reading the logs.
570 bool exit_on_finish_ = true;
Austin Schuhe309d2a2019-11-29 13:25:21 -0800571};
572
573} // namespace logger
574} // namespace aos
575
Austin Schuhb06f03b2021-02-17 22:00:37 -0800576#endif // AOS_EVENTS_LOGGING_LOG_READER_H_