blob: 3eebba71e33183c76651c70b226eb7cebbe35651 [file] [log] [blame]
Austin Schuhb06f03b2021-02-17 22:00:37 -08001#ifndef AOS_EVENTS_LOGGING_LOG_READER_H_
2#define AOS_EVENTS_LOGGING_LOG_READER_H_
Austin Schuhe309d2a2019-11-29 13:25:21 -08003
Austin Schuh8bd96322020-02-13 21:18:22 -08004#include <chrono>
Austin Schuhe309d2a2019-11-29 13:25:21 -08005#include <deque>
Austin Schuh05b70472020-01-01 17:11:17 -08006#include <string_view>
Austin Schuh2f8fd752020-09-01 22:38:28 -07007#include <tuple>
Austin Schuh6f3babe2020-01-26 20:34:50 -08008#include <vector>
Austin Schuhe309d2a2019-11-29 13:25:21 -08009
Austin Schuhe309d2a2019-11-29 13:25:21 -080010#include "aos/events/event_loop.h"
Austin Schuhf6f9bf32020-10-11 14:37:43 -070011#include "aos/events/logging/logfile_sorting.h"
Austin Schuha36c8902019-12-30 18:07:15 -080012#include "aos/events/logging/logfile_utils.h"
James Kuszmaul38735e82019-12-07 16:42:06 -080013#include "aos/events/logging/logger_generated.h"
Austin Schuh92547522019-12-28 14:33:43 -080014#include "aos/events/simulated_event_loop.h"
Austin Schuh2f8fd752020-09-01 22:38:28 -070015#include "aos/network/message_bridge_server_generated.h"
Austin Schuh0ca1fd32020-12-18 22:53:05 -080016#include "aos/network/multinode_timestamp_filter.h"
Austin Schuh0de30f32020-12-06 12:44:28 -080017#include "aos/network/remote_message_generated.h"
Austin Schuh8bd96322020-02-13 21:18:22 -080018#include "aos/network/timestamp_filter.h"
Austin Schuhe309d2a2019-11-29 13:25:21 -080019#include "aos/time/time.h"
Austin Schuh4385b142021-03-14 21:31:13 -070020#include "aos/uuid.h"
Austin Schuhe309d2a2019-11-29 13:25:21 -080021#include "flatbuffers/flatbuffers.h"
22
23namespace aos {
24namespace logger {
25
Austin Schuh6f3babe2020-01-26 20:34:50 -080026// We end up with one of the following 3 log file types.
27//
28// Single node logged as the source node.
29// -> Replayed just on the source node.
30//
31// Forwarding timestamps only logged from the perspective of the destination
32// node.
33// -> Matched with data on source node and logged.
34//
35// Forwarding timestamps with data logged as the destination node.
36// -> Replayed just as the destination
37// -> Replayed as the source (Much harder, ordering is not defined)
38//
39// Duplicate data logged. -> CHECK that it matches and explode otherwise.
40//
41// This can be boiled down to a set of constraints and tools.
42//
43// 1) Forwarding timestamps and data need to be logged separately.
44// 2) Any forwarded data logged on the destination node needs to be logged
45// separately such that it can be sorted.
46//
47// 1) Log reader needs to be able to sort a list of log files.
48// 2) Log reader needs to be able to merge sorted lists of log files.
49// 3) Log reader needs to be able to match timestamps with messages.
50//
51// We also need to be able to generate multiple views of a log file depending on
52// the target.
53
Austin Schuhe309d2a2019-11-29 13:25:21 -080054// Replays all the channels in the logfile to the event loop.
55class LogReader {
56 public:
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -080057 // If you want to supply a new configuration that will be used for replay
58 // (e.g., to change message rates, or to populate an updated schema), then
59 // pass it in here. It must provide all the channels that the original logged
60 // config did.
Austin Schuh6f3babe2020-01-26 20:34:50 -080061 //
Austin Schuh287d43d2020-12-04 20:19:33 -080062 // The single file constructor calls SortParts internally.
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -080063 LogReader(std::string_view filename,
64 const Configuration *replay_configuration = nullptr);
Austin Schuh287d43d2020-12-04 20:19:33 -080065 LogReader(std::vector<LogFile> log_files,
Austin Schuh11d43732020-09-21 17:28:30 -070066 const Configuration *replay_configuration = nullptr);
James Kuszmaul7daef362019-12-31 18:28:17 -080067 ~LogReader();
Austin Schuhe309d2a2019-11-29 13:25:21 -080068
Austin Schuh6331ef92020-01-07 18:28:09 -080069 // Registers all the callbacks to send the log file data out on an event loop
70 // created in event_loop_factory. This also updates time to be at the start
71 // of the log file by running until the log file starts.
72 // Note: the configuration used in the factory should be configuration()
73 // below, but can be anything as long as the locations needed to send
74 // everything are available.
James Kuszmaul84ff3e52020-01-03 19:48:53 -080075 void Register(SimulatedEventLoopFactory *event_loop_factory);
Austin Schuh58646e22021-08-23 23:51:46 -070076 // Registers all the callbacks to send the log file data out to an event loop
77 // factory. This does not start replaying or change the current distributed
78 // time of the factory. It does change the monotonic clocks to be right.
79 void RegisterWithoutStarting(SimulatedEventLoopFactory *event_loop_factory);
Austin Schuh6331ef92020-01-07 18:28:09 -080080 // Creates an SimulatedEventLoopFactory accessible via event_loop_factory(),
81 // and then calls Register.
82 void Register();
83 // Registers callbacks for all the events after the log file starts. This is
84 // only useful when replaying live.
Austin Schuhe309d2a2019-11-29 13:25:21 -080085 void Register(EventLoop *event_loop);
Austin Schuh6331ef92020-01-07 18:28:09 -080086
Austin Schuh58646e22021-08-23 23:51:46 -070087 // Called whenever a log file starts for a node.
88 void OnStart(std::function<void()> fn);
89 void OnStart(const Node *node, std::function<void()> fn);
90 // Called whenever a log file ends for a node.
91 void OnEnd(std::function<void()> fn);
92 void OnEnd(const Node *node, std::function<void()> fn);
93
James Kuszmaul84ff3e52020-01-03 19:48:53 -080094 // Unregisters the senders. You only need to call this if you separately
95 // supplied an event loop or event loop factory and the lifetimes are such
96 // that they need to be explicitly destroyed before the LogReader destructor
97 // gets called.
Austin Schuhe309d2a2019-11-29 13:25:21 -080098 void Deregister();
99
Austin Schuh0c297012020-09-16 18:41:59 -0700100 // Returns the configuration being used for replay from the log file.
101 // Note that this may be different from the configuration actually used for
102 // handling events. You should generally only use this to create a
103 // SimulatedEventLoopFactory, and then get the configuration from there for
104 // everything else.
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800105 const Configuration *logged_configuration() const;
Austin Schuh11d43732020-09-21 17:28:30 -0700106 // Returns the configuration being used for replay from the log file.
107 // Note that this may be different from the configuration actually used for
108 // handling events. You should generally only use this to create a
109 // SimulatedEventLoopFactory, and then get the configuration from there for
110 // everything else.
Austin Schuh6f3babe2020-01-26 20:34:50 -0800111 // The pointer is invalidated whenever RemapLoggedChannel is called.
Austin Schuh15649d62019-12-28 16:36:38 -0800112 const Configuration *configuration() const;
113
Austin Schuh6f3babe2020-01-26 20:34:50 -0800114 // Returns the nodes that this log file was created on. This is a list of
Austin Schuh07676622021-01-21 18:59:17 -0800115 // pointers to a node in the nodes() list inside logged_configuration().
116 std::vector<const Node *> LoggedNodes() const;
Austin Schuhe309d2a2019-11-29 13:25:21 -0800117
118 // Returns the starting timestamp for the log file.
Austin Schuh11d43732020-09-21 17:28:30 -0700119 monotonic_clock::time_point monotonic_start_time(
120 const Node *node = nullptr) const;
121 realtime_clock::time_point realtime_start_time(
122 const Node *node = nullptr) const;
Austin Schuhe309d2a2019-11-29 13:25:21 -0800123
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800124 // Causes the logger to publish the provided channel on a different name so
125 // that replayed applications can publish on the proper channel name without
126 // interference. This operates on raw channel names, without any node or
127 // application specific mappings.
128 void RemapLoggedChannel(std::string_view name, std::string_view type,
Austin Schuh0de30f32020-12-06 12:44:28 -0800129 std::string_view add_prefix = "/original",
130 std::string_view new_type = "");
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800131 template <typename T>
132 void RemapLoggedChannel(std::string_view name,
Austin Schuh0de30f32020-12-06 12:44:28 -0800133 std::string_view add_prefix = "/original",
134 std::string_view new_type = "") {
135 RemapLoggedChannel(name, T::GetFullyQualifiedName(), add_prefix, new_type);
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800136 }
137
Austin Schuh01b4c352020-09-21 23:09:39 -0700138 // Remaps the provided channel, though this respects node mappings, and
139 // preserves them too. This makes it so if /aos -> /pi1/aos on one node,
140 // /original/aos -> /original/pi1/aos on the same node after renaming, just
Austin Schuh0de30f32020-12-06 12:44:28 -0800141 // like you would hope. If new_type is not empty, the new channel will use
142 // the provided type instead. This allows for renaming messages.
Austin Schuh01b4c352020-09-21 23:09:39 -0700143 //
144 // TODO(austin): If you have 2 nodes remapping something to the same channel,
145 // this doesn't handle that. No use cases exist yet for that, so it isn't
146 // being done yet.
147 void RemapLoggedChannel(std::string_view name, std::string_view type,
148 const Node *node,
Austin Schuh0de30f32020-12-06 12:44:28 -0800149 std::string_view add_prefix = "/original",
150 std::string_view new_type = "");
Brian Silvermande9f3ff2020-04-28 16:56:58 -0700151 template <typename T>
Austin Schuh01b4c352020-09-21 23:09:39 -0700152 void RemapLoggedChannel(std::string_view name, const Node *node,
Austin Schuh0de30f32020-12-06 12:44:28 -0800153 std::string_view add_prefix = "/original",
154 std::string_view new_type = "") {
155 RemapLoggedChannel(name, T::GetFullyQualifiedName(), node, add_prefix,
156 new_type);
Austin Schuh01b4c352020-09-21 23:09:39 -0700157 }
158
159 template <typename T>
160 bool HasChannel(std::string_view name, const Node *node = nullptr) {
Austin Schuh0ca51f32020-12-25 21:51:45 -0800161 return configuration::GetChannel(logged_configuration(), name,
Austin Schuh0de30f32020-12-06 12:44:28 -0800162 T::GetFullyQualifiedName(), "", node,
163 true) != nullptr;
Brian Silvermande9f3ff2020-04-28 16:56:58 -0700164 }
165
Austin Schuh82529062021-12-08 12:09:52 -0800166 template <typename T>
167 void MaybeRemapLoggedChannel(std::string_view name,
168 const Node *node = nullptr) {
169 if (HasChannel<T>(name, node)) {
170 RemapLoggedChannel<T>(name, node);
171 }
172 }
173
James Kuszmaul4f106fb2021-01-05 20:53:02 -0800174 // Returns true if the channel exists on the node and was logged.
175 template <typename T>
176 bool HasLoggedChannel(std::string_view name, const Node *node = nullptr) {
Austin Schuh5ee56872021-01-30 16:53:34 -0800177 const Channel *channel =
178 configuration::GetChannel(logged_configuration(), name,
179 T::GetFullyQualifiedName(), "", node, true);
James Kuszmaul4f106fb2021-01-05 20:53:02 -0800180 if (channel == nullptr) return false;
181 return channel->logger() != LoggerConfig::NOT_LOGGED;
182 }
183
Austin Schuh1c227352021-09-17 12:53:54 -0700184 // Returns a list of all the original channels from remapping.
185 std::vector<const Channel *> RemappedChannels() const;
186
James Kuszmaul84ff3e52020-01-03 19:48:53 -0800187 SimulatedEventLoopFactory *event_loop_factory() {
188 return event_loop_factory_;
189 }
190
Austin Schuh0ca51f32020-12-25 21:51:45 -0800191 std::string_view name() const { return log_files_[0].name; }
Austin Schuh0c297012020-09-16 18:41:59 -0700192
James Kuszmaul71a81932020-12-15 21:08:01 -0800193 // Set whether to exit the SimulatedEventLoopFactory when we finish reading
194 // the logfile.
195 void set_exit_on_finish(bool exit_on_finish) {
196 exit_on_finish_ = exit_on_finish;
197 }
198
Austin Schuhe309d2a2019-11-29 13:25:21 -0800199 private:
Austin Schuh58646e22021-08-23 23:51:46 -0700200 void Register(EventLoop *event_loop, const Node *node);
201
202 void RegisterDuringStartup(EventLoop *event_loop, const Node *node);
203
204 const Channel *RemapChannel(const EventLoop *event_loop, const Node *node,
Austin Schuh6f3babe2020-01-26 20:34:50 -0800205 const Channel *channel);
206
Austin Schuhe309d2a2019-11-29 13:25:21 -0800207 // Queues at least max_out_of_order_duration_ messages into channels_.
208 void QueueMessages();
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800209 // Handle constructing a configuration with all the additional remapped
210 // channels from calls to RemapLoggedChannel.
211 void MakeRemappedConfig();
Austin Schuhe309d2a2019-11-29 13:25:21 -0800212
Austin Schuh2f8fd752020-09-01 22:38:28 -0700213 // Returns the number of nodes.
214 size_t nodes_count() const {
215 return !configuration::MultiNode(logged_configuration())
216 ? 1u
217 : logged_configuration()->nodes()->size();
218 }
219
Austin Schuh287d43d2020-12-04 20:19:33 -0800220 const std::vector<LogFile> log_files_;
Austin Schuh6f3babe2020-01-26 20:34:50 -0800221
Austin Schuh969cd602021-01-03 00:09:45 -0800222 // Class to manage sending RemoteMessages on the provided node after the
223 // correct delay.
Austin Schuh5ee56872021-01-30 16:53:34 -0800224 class RemoteMessageSender {
Austin Schuh969cd602021-01-03 00:09:45 -0800225 public:
226 RemoteMessageSender(aos::Sender<message_bridge::RemoteMessage> sender,
227 EventLoop *event_loop);
228 RemoteMessageSender(RemoteMessageSender const &) = delete;
229 RemoteMessageSender &operator=(RemoteMessageSender const &) = delete;
230
231 // Sends the provided message. If monotonic_timestamp_time is min_time,
232 // send it immediately.
233 void Send(
234 FlatbufferDetachedBuffer<message_bridge::RemoteMessage> remote_message,
Austin Schuh58646e22021-08-23 23:51:46 -0700235 BootTimestamp monotonic_timestamp_time, size_t source_boot_count);
Austin Schuh969cd602021-01-03 00:09:45 -0800236
237 private:
238 // Handles actually sending the timestamp if we were delayed.
239 void SendTimestamp();
240 // Handles scheduling the timer to send at the correct time.
241 void ScheduleTimestamp();
242
243 EventLoop *event_loop_;
244 aos::Sender<message_bridge::RemoteMessage> sender_;
245 aos::TimerHandler *timer_;
246
247 // Time we are scheduled for, or min_time if we aren't scheduled.
248 monotonic_clock::time_point scheduled_time_ = monotonic_clock::min_time;
249
250 struct Timestamp {
251 Timestamp(FlatbufferDetachedBuffer<message_bridge::RemoteMessage>
252 new_remote_message,
253 monotonic_clock::time_point new_monotonic_timestamp_time)
254 : remote_message(std::move(new_remote_message)),
255 monotonic_timestamp_time(new_monotonic_timestamp_time) {}
256 FlatbufferDetachedBuffer<message_bridge::RemoteMessage> remote_message;
257 monotonic_clock::time_point monotonic_timestamp_time;
258 };
259
260 // List of messages to send. The timer works through them and then disables
261 // itself automatically.
262 std::deque<Timestamp> remote_timestamps_;
263 };
264
Austin Schuh6f3babe2020-01-26 20:34:50 -0800265 // State per node.
Austin Schuh858c9f32020-08-31 16:56:12 -0700266 class State {
267 public:
Austin Schuh58646e22021-08-23 23:51:46 -0700268 State(std::unique_ptr<TimestampMapper> timestamp_mapper, const Node *node);
Austin Schuh287d43d2020-12-04 20:19:33 -0800269
270 // Connects up the timestamp mappers.
271 void AddPeer(State *peer);
Austin Schuh6f3babe2020-01-26 20:34:50 -0800272
Austin Schuhe639ea12021-01-25 13:00:22 -0800273 TimestampMapper *timestamp_mapper() { return timestamp_mapper_.get(); }
274
Austin Schuhdda74ec2021-01-03 19:30:37 -0800275 // Returns the next sorted message with all the timestamps extracted and
276 // matched.
277 TimestampedMessage PopOldest();
Austin Schuh188eabe2020-12-29 23:41:13 -0800278
Austin Schuh858c9f32020-08-31 16:56:12 -0700279 // Returns the monotonic time of the oldest message.
Austin Schuh58646e22021-08-23 23:51:46 -0700280 BootTimestamp OldestMessageTime() const;
281
282 size_t boot_count() const {
283 // If we are replaying directly into an event loop, we can't reboot. So
284 // we will stay stuck on the 0th boot.
285 if (!node_event_loop_factory_) return 0u;
286 return node_event_loop_factory_->boot_count();
287 }
Austin Schuh858c9f32020-08-31 16:56:12 -0700288
289 // Primes the queues inside State. Should be called before calling
290 // OldestMessageTime.
291 void SeedSortedMessages();
Austin Schuh8bd96322020-02-13 21:18:22 -0800292
Austin Schuh58646e22021-08-23 23:51:46 -0700293 void SetupStartupTimer() {
294 const monotonic_clock::time_point start_time =
295 monotonic_start_time(boot_count());
296 if (start_time == monotonic_clock::min_time) {
297 LOG(ERROR)
298 << "No start time, skipping, please figure out when this happens";
299 RunOnStart();
300 return;
301 }
James Kuszmaul57d39742021-10-15 20:07:34 -0700302 CHECK_GE(start_time, event_loop_->monotonic_now());
Austin Schuh58646e22021-08-23 23:51:46 -0700303 startup_timer_->Setup(start_time);
304 }
305
306 void set_startup_timer(TimerHandler *timer_handler) {
307 startup_timer_ = timer_handler;
308 if (startup_timer_) {
309 if (event_loop_->node() != nullptr) {
310 startup_timer_->set_name(absl::StrCat(
311 event_loop_->node()->name()->string_view(), "_startup"));
312 } else {
313 startup_timer_->set_name("startup");
314 }
315 }
316 }
317
Austin Schuh858c9f32020-08-31 16:56:12 -0700318 // Returns the starting time for this node.
Austin Schuh2dc8c7d2021-07-01 17:41:28 -0700319 monotonic_clock::time_point monotonic_start_time(size_t boot_count) const {
320 return timestamp_mapper_
321 ? timestamp_mapper_->monotonic_start_time(boot_count)
322 : monotonic_clock::min_time;
Austin Schuh858c9f32020-08-31 16:56:12 -0700323 }
Austin Schuh2dc8c7d2021-07-01 17:41:28 -0700324 realtime_clock::time_point realtime_start_time(size_t boot_count) const {
325 return timestamp_mapper_
326 ? timestamp_mapper_->realtime_start_time(boot_count)
327 : realtime_clock::min_time;
Austin Schuh858c9f32020-08-31 16:56:12 -0700328 }
329
330 // Sets the node event loop factory for replaying into a
331 // SimulatedEventLoopFactory. Returns the EventLoop to use.
Austin Schuh58646e22021-08-23 23:51:46 -0700332 void SetNodeEventLoopFactory(NodeEventLoopFactory *node_event_loop_factory);
Austin Schuh858c9f32020-08-31 16:56:12 -0700333
334 // Sets and gets the event loop to use.
335 void set_event_loop(EventLoop *event_loop) { event_loop_ = event_loop; }
336 EventLoop *event_loop() { return event_loop_; }
337
Austin Schuh58646e22021-08-23 23:51:46 -0700338 const Node *node() const { return node_; }
339
340 void Register(EventLoop *event_loop);
341
342 void OnStart(std::function<void()> fn);
343 void OnEnd(std::function<void()> fn);
344
Austin Schuh858c9f32020-08-31 16:56:12 -0700345 // Sets the current realtime offset from the monotonic clock for this node
346 // (if we are on a simulated event loop).
347 void SetRealtimeOffset(monotonic_clock::time_point monotonic_time,
348 realtime_clock::time_point realtime_time) {
349 if (node_event_loop_factory_ != nullptr) {
350 node_event_loop_factory_->SetRealtimeOffset(monotonic_time,
351 realtime_time);
352 }
353 }
354
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700355 // Returns the MessageHeader sender to log delivery timestamps to for the
356 // provided remote node.
Austin Schuh61e973f2021-02-21 21:43:56 -0800357 RemoteMessageSender *RemoteTimestampSender(const Channel *channel,
358 const Connection *connection);
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700359
Austin Schuh858c9f32020-08-31 16:56:12 -0700360 // Converts a timestamp from the monotonic clock on this node to the
361 // distributed clock.
362 distributed_clock::time_point ToDistributedClock(
363 monotonic_clock::time_point time) {
364 return node_event_loop_factory_->ToDistributedClock(time);
365 }
366
Austin Schuh858c9f32020-08-31 16:56:12 -0700367 // Returns the current time on the remote node which sends messages on
368 // channel_index.
Austin Schuh58646e22021-08-23 23:51:46 -0700369 BootTimestamp monotonic_remote_now(size_t channel_index) {
370 State *s = channel_source_state_[channel_index];
371 return BootTimestamp{
372 .boot = s->boot_count(),
373 .time = s->node_event_loop_factory_->monotonic_now()};
Austin Schuh858c9f32020-08-31 16:56:12 -0700374 }
375
Austin Schuh5ee56872021-01-30 16:53:34 -0800376 // Returns the start time of the remote for the provided channel.
377 monotonic_clock::time_point monotonic_remote_start_time(
Austin Schuh58646e22021-08-23 23:51:46 -0700378 size_t boot_count, size_t channel_index) {
Austin Schuh2dc8c7d2021-07-01 17:41:28 -0700379 return channel_source_state_[channel_index]->monotonic_start_time(
380 boot_count);
Austin Schuh5ee56872021-01-30 16:53:34 -0800381 }
382
Austin Schuh58646e22021-08-23 23:51:46 -0700383 void DestroyEventLoop() { event_loop_unique_ptr_.reset(); }
384
385 EventLoop *MakeEventLoop() {
386 CHECK(!event_loop_unique_ptr_);
387 event_loop_unique_ptr_ =
388 node_event_loop_factory_->MakeEventLoop("log_reader");
389 return event_loop_unique_ptr_.get();
390 }
391
Austin Schuh2f8fd752020-09-01 22:38:28 -0700392 distributed_clock::time_point RemoteToDistributedClock(
393 size_t channel_index, monotonic_clock::time_point time) {
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700394 return channel_source_state_[channel_index]
395 ->node_event_loop_factory_->ToDistributedClock(time);
Austin Schuh2f8fd752020-09-01 22:38:28 -0700396 }
397
398 const Node *remote_node(size_t channel_index) {
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700399 return channel_source_state_[channel_index]
400 ->node_event_loop_factory_->node();
Austin Schuh2f8fd752020-09-01 22:38:28 -0700401 }
402
Stephan Pleines559fa6c2022-01-06 17:23:51 -0800403 monotonic_clock::time_point monotonic_now() const {
Austin Schuh2f8fd752020-09-01 22:38:28 -0700404 return node_event_loop_factory_->monotonic_now();
405 }
406
Austin Schuh858c9f32020-08-31 16:56:12 -0700407 // Sets the number of channels.
408 void SetChannelCount(size_t count);
409
410 // Sets the sender, filter, and target factory for a channel.
Austin Schuh969cd602021-01-03 00:09:45 -0800411 void SetChannel(size_t logged_channel_index, size_t factory_channel_index,
412 std::unique_ptr<RawSender> sender,
413 message_bridge::NoncausalOffsetEstimator *filter,
Austin Schuh58646e22021-08-23 23:51:46 -0700414 bool is_forwarded, State *source_state);
415
416 void SetRemoteTimestampSender(size_t logged_channel_index,
417 RemoteMessageSender *remote_timestamp_sender);
418
419 void RunOnStart();
420 void RunOnEnd();
Austin Schuh858c9f32020-08-31 16:56:12 -0700421
Austin Schuh858c9f32020-08-31 16:56:12 -0700422 // Unregisters everything so we can destory the event loop.
Austin Schuh58646e22021-08-23 23:51:46 -0700423 // TODO(austin): Is this needed? OnShutdown should be able to serve this
424 // need.
Austin Schuh858c9f32020-08-31 16:56:12 -0700425 void Deregister();
426
427 // Sets the current TimerHandle for the replay callback.
428 void set_timer_handler(TimerHandler *timer_handler) {
429 timer_handler_ = timer_handler;
Austin Schuh58646e22021-08-23 23:51:46 -0700430 if (timer_handler_) {
431 if (event_loop_->node() != nullptr) {
432 timer_handler_->set_name(absl::StrCat(
433 event_loop_->node()->name()->string_view(), "_main"));
434 } else {
435 timer_handler_->set_name("main");
436 }
437 }
Austin Schuh858c9f32020-08-31 16:56:12 -0700438 }
439
440 // Sets the next wakeup time on the replay callback.
441 void Setup(monotonic_clock::time_point next_time) {
442 timer_handler_->Setup(next_time);
443 }
444
445 // Sends a buffer on the provided channel index.
Austin Schuh287d43d2020-12-04 20:19:33 -0800446 bool Send(const TimestampedMessage &timestamped_message);
Austin Schuh858c9f32020-08-31 16:56:12 -0700447
448 // Returns a debug string for the channel merger.
Austin Schuh2f8fd752020-09-01 22:38:28 -0700449 std::string DebugString() const {
Austin Schuh287d43d2020-12-04 20:19:33 -0800450 if (!timestamp_mapper_) {
Austin Schuhe639ea12021-01-25 13:00:22 -0800451 return "";
Austin Schuh287d43d2020-12-04 20:19:33 -0800452 }
Austin Schuhe639ea12021-01-25 13:00:22 -0800453 return timestamp_mapper_->DebugString();
Austin Schuh2f8fd752020-09-01 22:38:28 -0700454 }
Austin Schuh858c9f32020-08-31 16:56:12 -0700455
Austin Schuh58646e22021-08-23 23:51:46 -0700456 void ClearRemoteTimestampSenders() {
457 channel_timestamp_loggers_.clear();
458 timestamp_loggers_.clear();
459 }
460
Austin Schuhbd5f74a2021-11-11 20:55:38 -0800461 void SetFoundLastMessage(bool val) {
462 found_last_message_ = val;
463 last_message_.resize(factory_channel_index_.size(), false);
464 }
465 bool found_last_message() const { return found_last_message_; }
466
467 void set_last_message(size_t channel_index) {
468 CHECK_LT(channel_index, last_message_.size());
469 last_message_[channel_index] = true;
470 }
471
472 bool last_message(size_t channel_index) {
473 CHECK_LT(channel_index, last_message_.size());
474 return last_message_[channel_index];
475 }
476
Austin Schuh858c9f32020-08-31 16:56:12 -0700477 private:
478 // Log file.
Austin Schuh287d43d2020-12-04 20:19:33 -0800479 std::unique_ptr<TimestampMapper> timestamp_mapper_;
Austin Schuh858c9f32020-08-31 16:56:12 -0700480
Austin Schuh858c9f32020-08-31 16:56:12 -0700481 // Senders.
482 std::vector<std::unique_ptr<RawSender>> channels_;
Austin Schuh969cd602021-01-03 00:09:45 -0800483 std::vector<RemoteMessageSender *> remote_timestamp_senders_;
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700484 // The mapping from logged channel index to sent channel index. Needed for
485 // sending out MessageHeaders.
486 std::vector<int> factory_channel_index_;
487
Austin Schuh9942bae2021-01-07 22:06:44 -0800488 struct ContiguousSentTimestamp {
489 // Most timestamps make it through the network, so it saves a ton of
490 // memory and CPU to store the start and end, and search for valid ranges.
491 // For one of the logs I looked at, we had 2 ranges for 4 days.
492 //
493 // Save monotonic times as well to help if a queue index ever wraps. Odds
494 // are very low, but doesn't hurt.
495 //
496 // The starting time and matching queue index.
497 monotonic_clock::time_point starting_monotonic_event_time =
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700498 monotonic_clock::min_time;
Austin Schuh9942bae2021-01-07 22:06:44 -0800499 uint32_t starting_queue_index = 0xffffffff;
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700500
Austin Schuh9942bae2021-01-07 22:06:44 -0800501 // Ending time and queue index.
502 monotonic_clock::time_point ending_monotonic_event_time =
503 monotonic_clock::max_time;
504 uint32_t ending_queue_index = 0xffffffff;
505
506 // The queue index that the first message was *actually* sent with. The
507 // queue indices are assumed to be contiguous through this range.
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700508 uint32_t actual_queue_index = 0xffffffff;
509 };
510
511 // Stores all the timestamps that have been sent on this channel. This is
512 // only done for channels which are forwarded and on the node which
Austin Schuh9942bae2021-01-07 22:06:44 -0800513 // initially sends the message. Compress using ranges and offsets.
514 std::vector<std::unique_ptr<std::vector<ContiguousSentTimestamp>>>
515 queue_index_map_;
Austin Schuh858c9f32020-08-31 16:56:12 -0700516
517 // Factory (if we are in sim) that this loop was created on.
518 NodeEventLoopFactory *node_event_loop_factory_ = nullptr;
519 std::unique_ptr<EventLoop> event_loop_unique_ptr_;
520 // Event loop.
Austin Schuh58646e22021-08-23 23:51:46 -0700521 const Node *node_ = nullptr;
Austin Schuh858c9f32020-08-31 16:56:12 -0700522 EventLoop *event_loop_ = nullptr;
523 // And timer used to send messages.
Austin Schuh58646e22021-08-23 23:51:46 -0700524 TimerHandler *timer_handler_ = nullptr;
525 TimerHandler *startup_timer_ = nullptr;
Austin Schuh858c9f32020-08-31 16:56:12 -0700526
Austin Schuh8bd96322020-02-13 21:18:22 -0800527 // Filters (or nullptr if it isn't a forwarded channel) for each channel.
528 // This corresponds to the object which is shared among all the channels
529 // going between 2 nodes. The second element in the tuple indicates if this
530 // is the primary direction or not.
Austin Schuh2f8fd752020-09-01 22:38:28 -0700531 std::vector<message_bridge::NoncausalOffsetEstimator *> filters_;
Austin Schuh8bd96322020-02-13 21:18:22 -0800532
533 // List of NodeEventLoopFactorys (or nullptr if it isn't a forwarded
534 // channel) which correspond to the originating node.
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700535 std::vector<State *> channel_source_state_;
536
Austin Schuh61e973f2021-02-21 21:43:56 -0800537 // This is a cache for channel, connection mapping to the corresponding
538 // sender.
539 absl::btree_map<std::pair<const Channel *, const Connection *>,
540 std::shared_ptr<RemoteMessageSender>>
541 channel_timestamp_loggers_;
542
543 // Mapping from resolved RemoteMessage channel to RemoteMessage sender. This
544 // is the channel that timestamps are published to.
545 absl::btree_map<const Channel *, std::shared_ptr<RemoteMessageSender>>
546 timestamp_loggers_;
Austin Schuh58646e22021-08-23 23:51:46 -0700547
548 std::vector<std::function<void()>> on_starts_;
549 std::vector<std::function<void()>> on_ends_;
550
551 bool stopped_ = false;
552 bool started_ = false;
Austin Schuhbd5f74a2021-11-11 20:55:38 -0800553
554 bool found_last_message_ = false;
555 std::vector<bool> last_message_;
Austin Schuh6f3babe2020-01-26 20:34:50 -0800556 };
557
Austin Schuh8bd96322020-02-13 21:18:22 -0800558 // Node index -> State.
559 std::vector<std::unique_ptr<State>> states_;
560
561 // Creates the requested filter if it doesn't exist, regardless of whether
562 // these nodes can actually communicate directly. The second return value
563 // reports if this is the primary direction or not.
Austin Schuh2f8fd752020-09-01 22:38:28 -0700564 message_bridge::NoncausalOffsetEstimator *GetFilter(const Node *node_a,
565 const Node *node_b);
Austin Schuh8bd96322020-02-13 21:18:22 -0800566
Austin Schuh8bd96322020-02-13 21:18:22 -0800567 // List of filters for a connection. The pointer to the first node will be
568 // less than the second node.
Austin Schuh0ca1fd32020-12-18 22:53:05 -0800569 std::unique_ptr<message_bridge::MultiNodeNoncausalOffsetEstimator> filters_;
Austin Schuh8bd96322020-02-13 21:18:22 -0800570
James Kuszmaul84ff3e52020-01-03 19:48:53 -0800571 std::unique_ptr<FlatbufferDetachedBuffer<Configuration>>
572 remapped_configuration_buffer_;
573
James Kuszmaul84ff3e52020-01-03 19:48:53 -0800574 std::unique_ptr<SimulatedEventLoopFactory> event_loop_factory_unique_ptr_;
575 SimulatedEventLoopFactory *event_loop_factory_ = nullptr;
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800576
577 // Map of channel indices to new name. The channel index will be an index into
578 // logged_configuration(), and the string key will be the name of the channel
579 // to send on instead of the logged channel name.
Austin Schuh0de30f32020-12-06 12:44:28 -0800580 struct RemappedChannel {
581 std::string remapped_name;
582 std::string new_type;
583 };
584 std::map<size_t, RemappedChannel> remapped_channels_;
Austin Schuh01b4c352020-09-21 23:09:39 -0700585 std::vector<MapT> maps_;
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800586
Austin Schuh6f3babe2020-01-26 20:34:50 -0800587 // Number of nodes which still have data to send. This is used to figure out
588 // when to exit.
589 size_t live_nodes_ = 0;
590
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800591 const Configuration *remapped_configuration_ = nullptr;
592 const Configuration *replay_configuration_ = nullptr;
Austin Schuhcde938c2020-02-02 17:30:07 -0800593
594 // If true, the replay timer will ignore any missing data. This is used
595 // during startup when we are bootstrapping everything and trying to get to
596 // the start of all the log files.
597 bool ignore_missing_data_ = false;
James Kuszmaul71a81932020-12-15 21:08:01 -0800598
599 // Whether to exit the SimulatedEventLoop when we finish reading the logs.
600 bool exit_on_finish_ = true;
Austin Schuhe309d2a2019-11-29 13:25:21 -0800601};
602
603} // namespace logger
604} // namespace aos
605
Austin Schuhb06f03b2021-02-17 22:00:37 -0800606#endif // AOS_EVENTS_LOGGING_LOG_READER_H_