blob: 49babe594faa57788949a8267af686d67d532a77 [file] [log] [blame]
Austin Schuhb06f03b2021-02-17 22:00:37 -08001#ifndef AOS_EVENTS_LOGGING_LOG_READER_H_
2#define AOS_EVENTS_LOGGING_LOG_READER_H_
Austin Schuhe309d2a2019-11-29 13:25:21 -08003
Austin Schuh8bd96322020-02-13 21:18:22 -08004#include <chrono>
Austin Schuhe309d2a2019-11-29 13:25:21 -08005#include <deque>
James Kuszmaula16a7912022-06-17 10:58:12 -07006#include <queue>
James Kuszmaulc3f34d12022-08-15 15:57:55 -07007#include <string_view>
Austin Schuh2f8fd752020-09-01 22:38:28 -07008#include <tuple>
Austin Schuh6f3babe2020-01-26 20:34:50 -08009#include <vector>
Austin Schuhe309d2a2019-11-29 13:25:21 -080010
James Kuszmaulc3f34d12022-08-15 15:57:55 -070011#include "aos/condition.h"
Austin Schuhe309d2a2019-11-29 13:25:21 -080012#include "aos/events/event_loop.h"
Austin Schuhf6f9bf32020-10-11 14:37:43 -070013#include "aos/events/logging/logfile_sorting.h"
Austin Schuha36c8902019-12-30 18:07:15 -080014#include "aos/events/logging/logfile_utils.h"
James Kuszmaul38735e82019-12-07 16:42:06 -080015#include "aos/events/logging/logger_generated.h"
James Kuszmaula16a7912022-06-17 10:58:12 -070016#include "aos/events/logging/replay_timing_generated.h"
James Kuszmaul09632422022-05-25 15:56:19 -070017#include "aos/events/shm_event_loop.h"
Austin Schuh92547522019-12-28 14:33:43 -080018#include "aos/events/simulated_event_loop.h"
James Kuszmaulc3f34d12022-08-15 15:57:55 -070019#include "aos/mutex/mutex.h"
Austin Schuh2f8fd752020-09-01 22:38:28 -070020#include "aos/network/message_bridge_server_generated.h"
Austin Schuh0ca1fd32020-12-18 22:53:05 -080021#include "aos/network/multinode_timestamp_filter.h"
Austin Schuh0de30f32020-12-06 12:44:28 -080022#include "aos/network/remote_message_generated.h"
Austin Schuh8bd96322020-02-13 21:18:22 -080023#include "aos/network/timestamp_filter.h"
Austin Schuhe309d2a2019-11-29 13:25:21 -080024#include "aos/time/time.h"
James Kuszmaula16a7912022-06-17 10:58:12 -070025#include "aos/util/threaded_queue.h"
James Kuszmaulc3f34d12022-08-15 15:57:55 -070026#include "aos/uuid.h"
Austin Schuhe309d2a2019-11-29 13:25:21 -080027#include "flatbuffers/flatbuffers.h"
28
29namespace aos {
30namespace logger {
31
Austin Schuhe33c08d2022-02-03 18:15:21 -080032class EventNotifier;
33
Eric Schmiedebergb38477e2022-12-02 16:08:04 -070034// Vector of pair of name and type of the channel
Sanjay Narayanan5ec00232022-07-08 15:21:30 -070035using ReplayChannels = std::vector<std::pair<std::string, std::string>>;
Eric Schmiedebergb38477e2022-12-02 16:08:04 -070036// Vector of channel indices
Naman Guptacf6d4422023-03-01 11:41:00 -080037using ReplayChannelIndices = std::vector<size_t>;
Eric Schmiedebergb38477e2022-12-02 16:08:04 -070038
Austin Schuh6f3babe2020-01-26 20:34:50 -080039// We end up with one of the following 3 log file types.
40//
41// Single node logged as the source node.
42// -> Replayed just on the source node.
43//
44// Forwarding timestamps only logged from the perspective of the destination
45// node.
46// -> Matched with data on source node and logged.
47//
48// Forwarding timestamps with data logged as the destination node.
49// -> Replayed just as the destination
50// -> Replayed as the source (Much harder, ordering is not defined)
51//
52// Duplicate data logged. -> CHECK that it matches and explode otherwise.
53//
54// This can be boiled down to a set of constraints and tools.
55//
56// 1) Forwarding timestamps and data need to be logged separately.
57// 2) Any forwarded data logged on the destination node needs to be logged
58// separately such that it can be sorted.
59//
60// 1) Log reader needs to be able to sort a list of log files.
61// 2) Log reader needs to be able to merge sorted lists of log files.
62// 3) Log reader needs to be able to match timestamps with messages.
63//
64// We also need to be able to generate multiple views of a log file depending on
65// the target.
James Kuszmaul298b4a22023-06-28 20:01:03 -070066//
67// In general, we aim to guarantee that if you are using the LogReader
68// "normally" you should be able to observe all the messages that existed on the
69// live system between the start time and the end of the logfile, and that
70// CHECK-failures will be generated if the LogReader cannot satisfy that
71// guarantee. There are currently a few deliberate exceptions to this:
72// * Any channel marked NOT_LOGGED in the configuration is known not to
73// have been logged and thus will be silently absent in log replay.
74// * If an incomplete set of log files is provided to the reader (e.g.,
75// only logs logged on a single node on a multi-node system), then
76// any *individual* channel as observed on a given node will be
77// consistent, but similarly to a NOT_LOGGED channel, some data may
78// not be available.
79// * At the end of a log, data for some channels/nodes may end before
80// others; during this time period, you may observe silently dropped
81// messages. This will be most obvious on uncleanly terminated logs or
82// when merging logfiles across nodes (as the logs on different nodes
83// will not finish at identical times).
Austin Schuh6f3babe2020-01-26 20:34:50 -080084
Austin Schuhe309d2a2019-11-29 13:25:21 -080085// Replays all the channels in the logfile to the event loop.
86class LogReader {
87 public:
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -080088 // If you want to supply a new configuration that will be used for replay
89 // (e.g., to change message rates, or to populate an updated schema), then
90 // pass it in here. It must provide all the channels that the original logged
91 // config did.
Austin Schuh6f3babe2020-01-26 20:34:50 -080092 //
Eric Schmiedebergb38477e2022-12-02 16:08:04 -070093 // If certain messages should not be replayed, the replay_channels param can
94 // be used as an inclusive list of channels for messages to be replayed.
95 //
Austin Schuh287d43d2020-12-04 20:19:33 -080096 // The single file constructor calls SortParts internally.
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -080097 LogReader(std::string_view filename,
Eric Schmiedebergb38477e2022-12-02 16:08:04 -070098 const Configuration *replay_configuration = nullptr,
99 const ReplayChannels *replay_channels = nullptr);
Austin Schuh287d43d2020-12-04 20:19:33 -0800100 LogReader(std::vector<LogFile> log_files,
Eric Schmiedebergb38477e2022-12-02 16:08:04 -0700101 const Configuration *replay_configuration = nullptr,
102 const ReplayChannels *replay_channels = nullptr);
James Kuszmaul7daef362019-12-31 18:28:17 -0800103 ~LogReader();
Austin Schuhe309d2a2019-11-29 13:25:21 -0800104
Austin Schuh6331ef92020-01-07 18:28:09 -0800105 // Registers all the callbacks to send the log file data out on an event loop
106 // created in event_loop_factory. This also updates time to be at the start
107 // of the log file by running until the log file starts.
108 // Note: the configuration used in the factory should be configuration()
109 // below, but can be anything as long as the locations needed to send
110 // everything are available.
James Kuszmaul84ff3e52020-01-03 19:48:53 -0800111 void Register(SimulatedEventLoopFactory *event_loop_factory);
Austin Schuhe33c08d2022-02-03 18:15:21 -0800112
Austin Schuh58646e22021-08-23 23:51:46 -0700113 // Registers all the callbacks to send the log file data out to an event loop
114 // factory. This does not start replaying or change the current distributed
115 // time of the factory. It does change the monotonic clocks to be right.
116 void RegisterWithoutStarting(SimulatedEventLoopFactory *event_loop_factory);
Austin Schuhe33c08d2022-02-03 18:15:21 -0800117 // Runs the log until the last start time. Register above is defined as:
118 // Register(...) {
119 // RegisterWithoutStarting
120 // StartAfterRegister
121 // }
122 // This should generally be considered as a stepping stone to convert from
123 // Register() to RegisterWithoutStarting() incrementally.
124 void StartAfterRegister(SimulatedEventLoopFactory *event_loop_factory);
125
Austin Schuh6331ef92020-01-07 18:28:09 -0800126 // Creates an SimulatedEventLoopFactory accessible via event_loop_factory(),
127 // and then calls Register.
128 void Register();
James Kuszmaul09632422022-05-25 15:56:19 -0700129
Austin Schuh6331ef92020-01-07 18:28:09 -0800130 // Registers callbacks for all the events after the log file starts. This is
131 // only useful when replaying live.
Austin Schuhe309d2a2019-11-29 13:25:21 -0800132 void Register(EventLoop *event_loop);
Austin Schuh6331ef92020-01-07 18:28:09 -0800133
James Kuszmaula16a7912022-06-17 10:58:12 -0700134 // Sets a sender that should be used for tracking timing statistics. If not
135 // set, no statistics will be recorded.
136 void set_timing_accuracy_sender(
137 const Node *node, aos::Sender<timing::ReplayTiming> timing_sender) {
138 states_[configuration::GetNodeIndex(configuration(), node)]
139 ->set_timing_accuracy_sender(std::move(timing_sender));
140 }
141
Austin Schuh58646e22021-08-23 23:51:46 -0700142 // Called whenever a log file starts for a node.
James Kuszmaul82c3b512023-07-08 20:25:41 -0700143 // More precisely, this will be called on each boot at max of
144 // (realtime_start_time in the logfiles, SetStartTime()). If a given boot
145 // occurs entirely before the realtime_start_time, the OnStart handler will
146 // never get called for that boot.
147 //
148 // realtime_start_time is defined below, but/ essentially is the time at which
149 // message channels will start being internall consistent on a given node
150 // (i.e., when the logger started). Note: If you wish to see a watcher
151 // triggered for *every* message in a log, OnStart() will not be
152 // sufficient--messages (possibly multiple messages) may be present on
153 // channels prior to the start time. If attempting to do this, prefer to use
154 // NodeEventLoopFactory::OnStart.
Austin Schuh58646e22021-08-23 23:51:46 -0700155 void OnStart(std::function<void()> fn);
156 void OnStart(const Node *node, std::function<void()> fn);
James Kuszmaul82c3b512023-07-08 20:25:41 -0700157 // Called whenever a log file ends for a node on a given boot, or at the
158 // realtime_end_time specified by a flag or SetEndTime().
159 //
160 // A log file "ends" when there are no more messages to be replayed for that
161 // boot.
162 //
163 // If OnStart() is not called for a given boot, the OnEnd() handlers will not
164 // be called either. OnEnd() handlers will not be called if the logfile for a
165 // given boot has missing data that causes us to terminate replay early.
Austin Schuh58646e22021-08-23 23:51:46 -0700166 void OnEnd(std::function<void()> fn);
167 void OnEnd(const Node *node, std::function<void()> fn);
168
James Kuszmaul84ff3e52020-01-03 19:48:53 -0800169 // Unregisters the senders. You only need to call this if you separately
170 // supplied an event loop or event loop factory and the lifetimes are such
171 // that they need to be explicitly destroyed before the LogReader destructor
172 // gets called.
Austin Schuhe309d2a2019-11-29 13:25:21 -0800173 void Deregister();
174
Austin Schuh0c297012020-09-16 18:41:59 -0700175 // Returns the configuration being used for replay from the log file.
176 // Note that this may be different from the configuration actually used for
177 // handling events. You should generally only use this to create a
178 // SimulatedEventLoopFactory, and then get the configuration from there for
179 // everything else.
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800180 const Configuration *logged_configuration() const;
Austin Schuh11d43732020-09-21 17:28:30 -0700181 // Returns the configuration being used for replay from the log file.
182 // Note that this may be different from the configuration actually used for
183 // handling events. You should generally only use this to create a
184 // SimulatedEventLoopFactory, and then get the configuration from there for
185 // everything else.
Austin Schuh6f3babe2020-01-26 20:34:50 -0800186 // The pointer is invalidated whenever RemapLoggedChannel is called.
Austin Schuh15649d62019-12-28 16:36:38 -0800187 const Configuration *configuration() const;
188
Austin Schuh6f3babe2020-01-26 20:34:50 -0800189 // Returns the nodes that this log file was created on. This is a list of
Austin Schuh07676622021-01-21 18:59:17 -0800190 // pointers to a node in the nodes() list inside logged_configuration().
191 std::vector<const Node *> LoggedNodes() const;
Austin Schuhe309d2a2019-11-29 13:25:21 -0800192
193 // Returns the starting timestamp for the log file.
James Kuszmaul298b4a22023-06-28 20:01:03 -0700194 // All logged channels for the specified node should be entirely available
195 // after the specified time (i.e., any message that was available on the node
196 // in question after the monotonic start time but before the logs end and
197 // whose channel is present in any of the provided logs will either be
198 // available in the log or will result in an internal CHECK-failure of the
199 // LogReader if it would be skipped).
Austin Schuh11d43732020-09-21 17:28:30 -0700200 monotonic_clock::time_point monotonic_start_time(
201 const Node *node = nullptr) const;
202 realtime_clock::time_point realtime_start_time(
203 const Node *node = nullptr) const;
Austin Schuhe309d2a2019-11-29 13:25:21 -0800204
Austin Schuhe33c08d2022-02-03 18:15:21 -0800205 // Sets the start and end times to replay data until for all nodes. This
206 // overrides the --start_time and --end_time flags. The default is to replay
207 // all data.
208 void SetStartTime(std::string start_time);
209 void SetStartTime(realtime_clock::time_point start_time);
210 void SetEndTime(std::string end_time);
211 void SetEndTime(realtime_clock::time_point end_time);
212
James Kuszmaul53da7f32022-09-11 11:11:55 -0700213 // Enum to use for indicating how RemapLoggedChannel behaves when there is
214 // already a channel with the remapped name (e.g., as may happen when
215 // replaying a logfile that was itself generated from replay).
216 enum class RemapConflict {
217 // LOG(FATAL) on conflicts in remappings.
218 kDisallow,
219 // If we run into a conflict, attempt to remap the channel we would be
220 // overriding (and continue to do so if remapping *that* channel also
221 // generates a conflict).
222 // This will mean that if we repeatedly replay a log, we will end up
223 // stacking more and more /original's on the start of the oldest version
224 // of the channels.
225 kCascade
226 };
227
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800228 // Causes the logger to publish the provided channel on a different name so
229 // that replayed applications can publish on the proper channel name without
230 // interference. This operates on raw channel names, without any node or
231 // application specific mappings.
James Kuszmaul53da7f32022-09-11 11:11:55 -0700232 void RemapLoggedChannel(
233 std::string_view name, std::string_view type,
234 std::string_view add_prefix = "/original", std::string_view new_type = "",
235 RemapConflict conflict_handling = RemapConflict::kCascade);
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800236 template <typename T>
James Kuszmaul53da7f32022-09-11 11:11:55 -0700237 void RemapLoggedChannel(
238 std::string_view name, std::string_view add_prefix = "/original",
239 std::string_view new_type = "",
240 RemapConflict conflict_handling = RemapConflict::kCascade) {
241 RemapLoggedChannel(name, T::GetFullyQualifiedName(), add_prefix, new_type,
242 conflict_handling);
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800243 }
Austin Schuh01b4c352020-09-21 23:09:39 -0700244 // Remaps the provided channel, though this respects node mappings, and
245 // preserves them too. This makes it so if /aos -> /pi1/aos on one node,
246 // /original/aos -> /original/pi1/aos on the same node after renaming, just
Austin Schuh0de30f32020-12-06 12:44:28 -0800247 // like you would hope. If new_type is not empty, the new channel will use
248 // the provided type instead. This allows for renaming messages.
Austin Schuh01b4c352020-09-21 23:09:39 -0700249 //
250 // TODO(austin): If you have 2 nodes remapping something to the same channel,
251 // this doesn't handle that. No use cases exist yet for that, so it isn't
252 // being done yet.
James Kuszmaul53da7f32022-09-11 11:11:55 -0700253 void RemapLoggedChannel(
254 std::string_view name, std::string_view type, const Node *node,
255 std::string_view add_prefix = "/original", std::string_view new_type = "",
256 RemapConflict conflict_handling = RemapConflict::kCascade);
Brian Silvermande9f3ff2020-04-28 16:56:58 -0700257 template <typename T>
James Kuszmaul53da7f32022-09-11 11:11:55 -0700258 void RemapLoggedChannel(
259 std::string_view name, const Node *node,
260 std::string_view add_prefix = "/original", std::string_view new_type = "",
261 RemapConflict conflict_handling = RemapConflict::kCascade) {
Austin Schuh0de30f32020-12-06 12:44:28 -0800262 RemapLoggedChannel(name, T::GetFullyQualifiedName(), node, add_prefix,
James Kuszmaul53da7f32022-09-11 11:11:55 -0700263 new_type, conflict_handling);
Austin Schuh01b4c352020-09-21 23:09:39 -0700264 }
265
Sanjay Narayanan5ec00232022-07-08 15:21:30 -0700266 // Similar to RemapLoggedChannel(), but lets you specify a name for the new
267 // channel without constraints. This is useful when an application has been
268 // updated to use new channels but you want to support replaying old logs. By
269 // default, this will not add any maps for the new channel. Use add_maps to
270 // specify any maps you'd like added.
271 void RenameLoggedChannel(std::string_view name, std::string_view type,
272 std::string_view new_name,
273 const std::vector<MapT> &add_maps = {});
274 template <typename T>
275 void RenameLoggedChannel(std::string_view name, std::string_view new_name,
276 const std::vector<MapT> &add_maps = {}) {
277 RenameLoggedChannel(name, T::GetFullyQualifiedName(), new_name, add_maps);
278 }
279 // The following overloads are more suitable for multi-node configurations,
280 // and let you rename a channel on a specific node.
281 void RenameLoggedChannel(std::string_view name, std::string_view type,
282 const Node *node, std::string_view new_name,
283 const std::vector<MapT> &add_maps = {});
284 template <typename T>
285 void RenameLoggedChannel(std::string_view name, const Node *node,
286 std::string_view new_name,
287 const std::vector<MapT> &add_maps = {}) {
288 RenameLoggedChannel(name, T::GetFullyQualifiedName(), node, new_name,
289 add_maps);
290 }
291
Austin Schuh01b4c352020-09-21 23:09:39 -0700292 template <typename T>
293 bool HasChannel(std::string_view name, const Node *node = nullptr) {
Sanjay Narayanan5ec00232022-07-08 15:21:30 -0700294 return HasChannel(name, T::GetFullyQualifiedName(), node);
295 }
296 bool HasChannel(std::string_view name, std::string_view type,
297 const Node *node) {
298 return configuration::GetChannel(logged_configuration(), name, type, "",
299 node, true) != nullptr;
Brian Silvermande9f3ff2020-04-28 16:56:58 -0700300 }
301
Austin Schuh82529062021-12-08 12:09:52 -0800302 template <typename T>
303 void MaybeRemapLoggedChannel(std::string_view name,
304 const Node *node = nullptr) {
305 if (HasChannel<T>(name, node)) {
306 RemapLoggedChannel<T>(name, node);
307 }
308 }
Sanjay Narayanan5ec00232022-07-08 15:21:30 -0700309 template <typename T>
310 void MaybeRenameLoggedChannel(std::string_view name, const Node *node,
311 std::string_view new_name,
312 const std::vector<MapT> &add_maps = {}) {
313 if (HasChannel<T>(name, node)) {
314 RenameLoggedChannel<T>(name, node, new_name, add_maps);
315 }
316 }
Austin Schuh82529062021-12-08 12:09:52 -0800317
James Kuszmaul4f106fb2021-01-05 20:53:02 -0800318 // Returns true if the channel exists on the node and was logged.
319 template <typename T>
320 bool HasLoggedChannel(std::string_view name, const Node *node = nullptr) {
Austin Schuh5ee56872021-01-30 16:53:34 -0800321 const Channel *channel =
322 configuration::GetChannel(logged_configuration(), name,
323 T::GetFullyQualifiedName(), "", node, true);
James Kuszmaul4f106fb2021-01-05 20:53:02 -0800324 if (channel == nullptr) return false;
325 return channel->logger() != LoggerConfig::NOT_LOGGED;
326 }
327
Austin Schuh1c227352021-09-17 12:53:54 -0700328 // Returns a list of all the original channels from remapping.
329 std::vector<const Channel *> RemappedChannels() const;
330
James Kuszmaul84ff3e52020-01-03 19:48:53 -0800331 SimulatedEventLoopFactory *event_loop_factory() {
332 return event_loop_factory_;
333 }
334
Austin Schuh0ca51f32020-12-25 21:51:45 -0800335 std::string_view name() const { return log_files_[0].name; }
Austin Schuh84dd1332023-05-03 13:09:47 -0700336 std::string_view log_event_uuid() const {
337 return log_files_[0].log_event_uuid;
338 }
Austin Schuh0c297012020-09-16 18:41:59 -0700339
James Kuszmaul71a81932020-12-15 21:08:01 -0800340 // Set whether to exit the SimulatedEventLoopFactory when we finish reading
341 // the logfile.
342 void set_exit_on_finish(bool exit_on_finish) {
343 exit_on_finish_ = exit_on_finish;
344 }
James Kuszmaulb11a1502022-07-01 16:02:25 -0700345 bool exit_on_finish() const { return exit_on_finish_; }
James Kuszmaul71a81932020-12-15 21:08:01 -0800346
James Kuszmaulb67409b2022-06-20 16:25:03 -0700347 // Sets the realtime replay rate. A value of 1.0 will cause the scheduler to
348 // try to play events in realtime. 0.5 will run at half speed. Use infinity
349 // (the default) to run as fast as possible. This can be changed during
350 // run-time.
351 // Only applies when running against a SimulatedEventLoopFactory.
352 void SetRealtimeReplayRate(double replay_rate);
353
Austin Schuhe309d2a2019-11-29 13:25:21 -0800354 private:
Austin Schuh58646e22021-08-23 23:51:46 -0700355 void Register(EventLoop *event_loop, const Node *node);
356
357 void RegisterDuringStartup(EventLoop *event_loop, const Node *node);
358
359 const Channel *RemapChannel(const EventLoop *event_loop, const Node *node,
Austin Schuh6f3babe2020-01-26 20:34:50 -0800360 const Channel *channel);
361
Austin Schuhe309d2a2019-11-29 13:25:21 -0800362 // Queues at least max_out_of_order_duration_ messages into channels_.
363 void QueueMessages();
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800364 // Handle constructing a configuration with all the additional remapped
365 // channels from calls to RemapLoggedChannel.
366 void MakeRemappedConfig();
Austin Schuhe309d2a2019-11-29 13:25:21 -0800367
Austin Schuh2f8fd752020-09-01 22:38:28 -0700368 // Returns the number of nodes.
369 size_t nodes_count() const {
370 return !configuration::MultiNode(logged_configuration())
371 ? 1u
372 : logged_configuration()->nodes()->size();
373 }
374
James Kuszmaulb11a1502022-07-01 16:02:25 -0700375 // Handles when an individual node hits the realtime end time, exitting the
376 // entire event loop once all nodes are stopped.
377 void NoticeRealtimeEnd();
378
Austin Schuh287d43d2020-12-04 20:19:33 -0800379 const std::vector<LogFile> log_files_;
Austin Schuh6f3babe2020-01-26 20:34:50 -0800380
Austin Schuh969cd602021-01-03 00:09:45 -0800381 // Class to manage sending RemoteMessages on the provided node after the
382 // correct delay.
Austin Schuh5ee56872021-01-30 16:53:34 -0800383 class RemoteMessageSender {
Austin Schuh969cd602021-01-03 00:09:45 -0800384 public:
385 RemoteMessageSender(aos::Sender<message_bridge::RemoteMessage> sender,
386 EventLoop *event_loop);
387 RemoteMessageSender(RemoteMessageSender const &) = delete;
388 RemoteMessageSender &operator=(RemoteMessageSender const &) = delete;
389
390 // Sends the provided message. If monotonic_timestamp_time is min_time,
391 // send it immediately.
392 void Send(
393 FlatbufferDetachedBuffer<message_bridge::RemoteMessage> remote_message,
Austin Schuh58646e22021-08-23 23:51:46 -0700394 BootTimestamp monotonic_timestamp_time, size_t source_boot_count);
Austin Schuh969cd602021-01-03 00:09:45 -0800395
396 private:
397 // Handles actually sending the timestamp if we were delayed.
398 void SendTimestamp();
399 // Handles scheduling the timer to send at the correct time.
400 void ScheduleTimestamp();
401
402 EventLoop *event_loop_;
403 aos::Sender<message_bridge::RemoteMessage> sender_;
404 aos::TimerHandler *timer_;
405
406 // Time we are scheduled for, or min_time if we aren't scheduled.
407 monotonic_clock::time_point scheduled_time_ = monotonic_clock::min_time;
408
409 struct Timestamp {
410 Timestamp(FlatbufferDetachedBuffer<message_bridge::RemoteMessage>
411 new_remote_message,
412 monotonic_clock::time_point new_monotonic_timestamp_time)
413 : remote_message(std::move(new_remote_message)),
414 monotonic_timestamp_time(new_monotonic_timestamp_time) {}
415 FlatbufferDetachedBuffer<message_bridge::RemoteMessage> remote_message;
416 monotonic_clock::time_point monotonic_timestamp_time;
417 };
418
419 // List of messages to send. The timer works through them and then disables
420 // itself automatically.
421 std::deque<Timestamp> remote_timestamps_;
422 };
423
Austin Schuh6f3babe2020-01-26 20:34:50 -0800424 // State per node.
Austin Schuh858c9f32020-08-31 16:56:12 -0700425 class State {
426 public:
James Kuszmaula16a7912022-06-17 10:58:12 -0700427 // Whether we should spin up a separate thread for buffering up messages.
428 // Only allowed in realtime replay--see comments on threading_ member for
429 // details.
430 enum class ThreadedBuffering { kYes, kNo };
James Kuszmaul09632422022-05-25 15:56:19 -0700431 State(std::unique_ptr<TimestampMapper> timestamp_mapper,
432 message_bridge::MultiNodeNoncausalOffsetEstimator *multinode_filters,
James Kuszmaulb11a1502022-07-01 16:02:25 -0700433 std::function<void()> notice_realtime_end, const Node *node,
434 ThreadedBuffering threading,
Naman Guptacf6d4422023-03-01 11:41:00 -0800435 std::unique_ptr<const ReplayChannelIndices> replay_channel_indices);
Austin Schuh287d43d2020-12-04 20:19:33 -0800436
437 // Connects up the timestamp mappers.
438 void AddPeer(State *peer);
Austin Schuh6f3babe2020-01-26 20:34:50 -0800439
Austin Schuhe639ea12021-01-25 13:00:22 -0800440 TimestampMapper *timestamp_mapper() { return timestamp_mapper_.get(); }
441
Austin Schuhdda74ec2021-01-03 19:30:37 -0800442 // Returns the next sorted message with all the timestamps extracted and
443 // matched.
444 TimestampedMessage PopOldest();
Austin Schuh188eabe2020-12-29 23:41:13 -0800445
Austin Schuh858c9f32020-08-31 16:56:12 -0700446 // Returns the monotonic time of the oldest message.
James Kuszmaula16a7912022-06-17 10:58:12 -0700447 BootTimestamp SingleThreadedOldestMessageTime();
448 // Returns the monotonic time of the oldest message, handling querying the
449 // separate thread of ThreadedBuffering was set.
450 BootTimestamp MultiThreadedOldestMessageTime();
Austin Schuh58646e22021-08-23 23:51:46 -0700451
452 size_t boot_count() const {
453 // If we are replaying directly into an event loop, we can't reboot. So
454 // we will stay stuck on the 0th boot.
James Kuszmaul09632422022-05-25 15:56:19 -0700455 if (!node_event_loop_factory_) {
456 if (event_loop_ == nullptr) {
457 // If boot_count is being checked after startup for any of the
458 // non-primary nodes, then returning 0 may not be accurate (since
459 // remote nodes *can* reboot even if the EventLoop being played to
460 // can't).
461 CHECK(!started_);
462 CHECK(!stopped_);
463 }
464 return 0u;
465 }
Austin Schuh58646e22021-08-23 23:51:46 -0700466 return node_event_loop_factory_->boot_count();
467 }
Austin Schuh858c9f32020-08-31 16:56:12 -0700468
469 // Primes the queues inside State. Should be called before calling
470 // OldestMessageTime.
471 void SeedSortedMessages();
Austin Schuh8bd96322020-02-13 21:18:22 -0800472
Austin Schuh58646e22021-08-23 23:51:46 -0700473 void SetupStartupTimer() {
474 const monotonic_clock::time_point start_time =
475 monotonic_start_time(boot_count());
476 if (start_time == monotonic_clock::min_time) {
477 LOG(ERROR)
478 << "No start time, skipping, please figure out when this happens";
Austin Schuhe33c08d2022-02-03 18:15:21 -0800479 NotifyLogfileStart();
Austin Schuh58646e22021-08-23 23:51:46 -0700480 return;
481 }
James Kuszmaul09632422022-05-25 15:56:19 -0700482 if (node_event_loop_factory_) {
483 CHECK_GE(start_time + clock_offset(), event_loop_->monotonic_now());
484 }
485 startup_timer_->Setup(start_time + clock_offset());
Austin Schuh58646e22021-08-23 23:51:46 -0700486 }
487
488 void set_startup_timer(TimerHandler *timer_handler) {
489 startup_timer_ = timer_handler;
490 if (startup_timer_) {
491 if (event_loop_->node() != nullptr) {
492 startup_timer_->set_name(absl::StrCat(
493 event_loop_->node()->name()->string_view(), "_startup"));
494 } else {
495 startup_timer_->set_name("startup");
496 }
497 }
498 }
499
Austin Schuh858c9f32020-08-31 16:56:12 -0700500 // Returns the starting time for this node.
Austin Schuh2dc8c7d2021-07-01 17:41:28 -0700501 monotonic_clock::time_point monotonic_start_time(size_t boot_count) const {
502 return timestamp_mapper_
503 ? timestamp_mapper_->monotonic_start_time(boot_count)
504 : monotonic_clock::min_time;
Austin Schuh858c9f32020-08-31 16:56:12 -0700505 }
Austin Schuh2dc8c7d2021-07-01 17:41:28 -0700506 realtime_clock::time_point realtime_start_time(size_t boot_count) const {
507 return timestamp_mapper_
508 ? timestamp_mapper_->realtime_start_time(boot_count)
509 : realtime_clock::min_time;
Austin Schuh858c9f32020-08-31 16:56:12 -0700510 }
511
512 // Sets the node event loop factory for replaying into a
513 // SimulatedEventLoopFactory. Returns the EventLoop to use.
Austin Schuh60e77942022-05-16 17:48:24 -0700514 void SetNodeEventLoopFactory(NodeEventLoopFactory *node_event_loop_factory,
515 SimulatedEventLoopFactory *event_loop_factory);
Austin Schuh858c9f32020-08-31 16:56:12 -0700516
517 // Sets and gets the event loop to use.
518 void set_event_loop(EventLoop *event_loop) { event_loop_ = event_loop; }
519 EventLoop *event_loop() { return event_loop_; }
520
Austin Schuh58646e22021-08-23 23:51:46 -0700521 const Node *node() const { return node_; }
522
523 void Register(EventLoop *event_loop);
524
525 void OnStart(std::function<void()> fn);
526 void OnEnd(std::function<void()> fn);
527
Austin Schuh858c9f32020-08-31 16:56:12 -0700528 // Sets the current realtime offset from the monotonic clock for this node
529 // (if we are on a simulated event loop).
530 void SetRealtimeOffset(monotonic_clock::time_point monotonic_time,
531 realtime_clock::time_point realtime_time) {
532 if (node_event_loop_factory_ != nullptr) {
533 node_event_loop_factory_->SetRealtimeOffset(monotonic_time,
534 realtime_time);
535 }
536 }
537
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700538 // Returns the MessageHeader sender to log delivery timestamps to for the
539 // provided remote node.
Austin Schuh61e973f2021-02-21 21:43:56 -0800540 RemoteMessageSender *RemoteTimestampSender(const Channel *channel,
541 const Connection *connection);
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700542
Austin Schuh858c9f32020-08-31 16:56:12 -0700543 // Converts a timestamp from the monotonic clock on this node to the
544 // distributed clock.
545 distributed_clock::time_point ToDistributedClock(
546 monotonic_clock::time_point time) {
James Kuszmaul09632422022-05-25 15:56:19 -0700547 CHECK(node_event_loop_factory_);
Austin Schuh858c9f32020-08-31 16:56:12 -0700548 return node_event_loop_factory_->ToDistributedClock(time);
549 }
550
Austin Schuh858c9f32020-08-31 16:56:12 -0700551 // Returns the current time on the remote node which sends messages on
552 // channel_index.
Austin Schuh58646e22021-08-23 23:51:46 -0700553 BootTimestamp monotonic_remote_now(size_t channel_index) {
554 State *s = channel_source_state_[channel_index];
555 return BootTimestamp{
556 .boot = s->boot_count(),
557 .time = s->node_event_loop_factory_->monotonic_now()};
Austin Schuh858c9f32020-08-31 16:56:12 -0700558 }
559
Austin Schuh5ee56872021-01-30 16:53:34 -0800560 // Returns the start time of the remote for the provided channel.
561 monotonic_clock::time_point monotonic_remote_start_time(
Austin Schuh58646e22021-08-23 23:51:46 -0700562 size_t boot_count, size_t channel_index) {
Austin Schuh2dc8c7d2021-07-01 17:41:28 -0700563 return channel_source_state_[channel_index]->monotonic_start_time(
564 boot_count);
Austin Schuh5ee56872021-01-30 16:53:34 -0800565 }
566
Austin Schuh58646e22021-08-23 23:51:46 -0700567 void DestroyEventLoop() { event_loop_unique_ptr_.reset(); }
568
569 EventLoop *MakeEventLoop() {
570 CHECK(!event_loop_unique_ptr_);
James Kuszmaul890c2492022-04-06 14:59:31 -0700571 // TODO(james): Enable exclusive senders on LogReader to allow us to
572 // ensure we are remapping channels correctly.
573 event_loop_unique_ptr_ = node_event_loop_factory_->MakeEventLoop(
574 "log_reader", {NodeEventLoopFactory::CheckSentTooFast::kNo,
James Kuszmaul94ca5132022-07-19 09:11:08 -0700575 NodeEventLoopFactory::ExclusiveSenders::kYes,
576 NonExclusiveChannels()});
Austin Schuh58646e22021-08-23 23:51:46 -0700577 return event_loop_unique_ptr_.get();
578 }
579
Austin Schuh2f8fd752020-09-01 22:38:28 -0700580 distributed_clock::time_point RemoteToDistributedClock(
581 size_t channel_index, monotonic_clock::time_point time) {
James Kuszmaul09632422022-05-25 15:56:19 -0700582 CHECK(node_event_loop_factory_);
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700583 return channel_source_state_[channel_index]
584 ->node_event_loop_factory_->ToDistributedClock(time);
Austin Schuh2f8fd752020-09-01 22:38:28 -0700585 }
586
587 const Node *remote_node(size_t channel_index) {
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700588 return channel_source_state_[channel_index]
589 ->node_event_loop_factory_->node();
Austin Schuh2f8fd752020-09-01 22:38:28 -0700590 }
591
Stephan Pleines559fa6c2022-01-06 17:23:51 -0800592 monotonic_clock::time_point monotonic_now() const {
Alexei Strotsb8c3a702023-04-19 21:38:25 -0700593 CHECK_NOTNULL(event_loop_);
James Kuszmaul09632422022-05-25 15:56:19 -0700594 return event_loop_->monotonic_now();
Austin Schuh2f8fd752020-09-01 22:38:28 -0700595 }
596
Austin Schuh858c9f32020-08-31 16:56:12 -0700597 // Sets the number of channels.
598 void SetChannelCount(size_t count);
599
600 // Sets the sender, filter, and target factory for a channel.
Austin Schuh969cd602021-01-03 00:09:45 -0800601 void SetChannel(size_t logged_channel_index, size_t factory_channel_index,
602 std::unique_ptr<RawSender> sender,
603 message_bridge::NoncausalOffsetEstimator *filter,
Austin Schuh58646e22021-08-23 23:51:46 -0700604 bool is_forwarded, State *source_state);
605
606 void SetRemoteTimestampSender(size_t logged_channel_index,
607 RemoteMessageSender *remote_timestamp_sender);
608
609 void RunOnStart();
610 void RunOnEnd();
Austin Schuh858c9f32020-08-31 16:56:12 -0700611
Austin Schuhe33c08d2022-02-03 18:15:21 -0800612 // Handles a logfile start event to potentially call the OnStart callbacks.
613 void NotifyLogfileStart();
614 // Handles a start time flag start event to potentially call the OnStart
615 // callbacks.
616 void NotifyFlagStart();
617
618 // Handles a logfile end event to potentially call the OnEnd callbacks.
619 void NotifyLogfileEnd();
620 // Handles a end time flag start event to potentially call the OnEnd
621 // callbacks.
622 void NotifyFlagEnd();
623
Austin Schuh858c9f32020-08-31 16:56:12 -0700624 // Unregisters everything so we can destory the event loop.
Austin Schuh58646e22021-08-23 23:51:46 -0700625 // TODO(austin): Is this needed? OnShutdown should be able to serve this
626 // need.
Austin Schuh858c9f32020-08-31 16:56:12 -0700627 void Deregister();
628
629 // Sets the current TimerHandle for the replay callback.
630 void set_timer_handler(TimerHandler *timer_handler) {
631 timer_handler_ = timer_handler;
Austin Schuh58646e22021-08-23 23:51:46 -0700632 if (timer_handler_) {
633 if (event_loop_->node() != nullptr) {
634 timer_handler_->set_name(absl::StrCat(
635 event_loop_->node()->name()->string_view(), "_main"));
636 } else {
637 timer_handler_->set_name("main");
638 }
639 }
Austin Schuh858c9f32020-08-31 16:56:12 -0700640 }
641
Austin Schuhe33c08d2022-02-03 18:15:21 -0800642 // Creates and registers the --start_time and --end_time event callbacks.
643 void SetStartTimeFlag(realtime_clock::time_point start_time);
644 void SetEndTimeFlag(realtime_clock::time_point end_time);
645
646 // Notices the next message to update the start/end time callbacks.
647 void ObserveNextMessage(monotonic_clock::time_point monotonic_event,
648 realtime_clock::time_point realtime_event);
649
650 // Clears the start and end time flag handlers so we can delete the event
651 // loop.
652 void ClearTimeFlags();
653
Austin Schuh858c9f32020-08-31 16:56:12 -0700654 // Sets the next wakeup time on the replay callback.
655 void Setup(monotonic_clock::time_point next_time) {
James Kuszmaul8866e642022-06-10 16:00:36 -0700656 timer_handler_->Setup(
657 std::max(monotonic_now(), next_time + clock_offset()));
Austin Schuh858c9f32020-08-31 16:56:12 -0700658 }
659
660 // Sends a buffer on the provided channel index.
Austin Schuh287d43d2020-12-04 20:19:33 -0800661 bool Send(const TimestampedMessage &timestamped_message);
Austin Schuh858c9f32020-08-31 16:56:12 -0700662
James Kuszmaulc3f34d12022-08-15 15:57:55 -0700663 void MaybeSetClockOffset();
James Kuszmaul09632422022-05-25 15:56:19 -0700664 std::chrono::nanoseconds clock_offset() const { return clock_offset_; }
665
Austin Schuh858c9f32020-08-31 16:56:12 -0700666 // Returns a debug string for the channel merger.
Austin Schuh2f8fd752020-09-01 22:38:28 -0700667 std::string DebugString() const {
Austin Schuh287d43d2020-12-04 20:19:33 -0800668 if (!timestamp_mapper_) {
Austin Schuhe639ea12021-01-25 13:00:22 -0800669 return "";
Austin Schuh287d43d2020-12-04 20:19:33 -0800670 }
Austin Schuhe639ea12021-01-25 13:00:22 -0800671 return timestamp_mapper_->DebugString();
Austin Schuh2f8fd752020-09-01 22:38:28 -0700672 }
Austin Schuh858c9f32020-08-31 16:56:12 -0700673
Austin Schuh58646e22021-08-23 23:51:46 -0700674 void ClearRemoteTimestampSenders() {
675 channel_timestamp_loggers_.clear();
676 timestamp_loggers_.clear();
677 }
678
Austin Schuhbd5f74a2021-11-11 20:55:38 -0800679 void SetFoundLastMessage(bool val) {
680 found_last_message_ = val;
681 last_message_.resize(factory_channel_index_.size(), false);
682 }
683 bool found_last_message() const { return found_last_message_; }
684
685 void set_last_message(size_t channel_index) {
686 CHECK_LT(channel_index, last_message_.size());
687 last_message_[channel_index] = true;
688 }
689
690 bool last_message(size_t channel_index) {
691 CHECK_LT(channel_index, last_message_.size());
692 return last_message_[channel_index];
693 }
694
James Kuszmaula16a7912022-06-17 10:58:12 -0700695 void set_timing_accuracy_sender(
696 aos::Sender<timing::ReplayTiming> timing_sender) {
697 timing_statistics_sender_ = std::move(timing_sender);
698 OnEnd([this]() { SendMessageTimings(); });
699 }
700
701 // If running with ThreadedBuffering::kYes, will start the processing thread
702 // and queue up messages until the specified time. No-op of
703 // ThreadedBuffering::kNo is set. Should only be called once.
704 void QueueThreadUntil(BootTimestamp time);
705
Austin Schuh858c9f32020-08-31 16:56:12 -0700706 private:
James Kuszmaulc3f34d12022-08-15 15:57:55 -0700707 void TrackMessageSendTiming(const RawSender &sender,
708 monotonic_clock::time_point expected_send_time);
James Kuszmaula16a7912022-06-17 10:58:12 -0700709 void SendMessageTimings();
Austin Schuh858c9f32020-08-31 16:56:12 -0700710 // Log file.
Austin Schuh287d43d2020-12-04 20:19:33 -0800711 std::unique_ptr<TimestampMapper> timestamp_mapper_;
Austin Schuh858c9f32020-08-31 16:56:12 -0700712
Austin Schuh858c9f32020-08-31 16:56:12 -0700713 // Senders.
714 std::vector<std::unique_ptr<RawSender>> channels_;
Austin Schuh969cd602021-01-03 00:09:45 -0800715 std::vector<RemoteMessageSender *> remote_timestamp_senders_;
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700716 // The mapping from logged channel index to sent channel index. Needed for
717 // sending out MessageHeaders.
718 std::vector<int> factory_channel_index_;
719
Austin Schuh9942bae2021-01-07 22:06:44 -0800720 struct ContiguousSentTimestamp {
721 // Most timestamps make it through the network, so it saves a ton of
722 // memory and CPU to store the start and end, and search for valid ranges.
723 // For one of the logs I looked at, we had 2 ranges for 4 days.
724 //
725 // Save monotonic times as well to help if a queue index ever wraps. Odds
726 // are very low, but doesn't hurt.
727 //
728 // The starting time and matching queue index.
729 monotonic_clock::time_point starting_monotonic_event_time =
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700730 monotonic_clock::min_time;
Austin Schuh9942bae2021-01-07 22:06:44 -0800731 uint32_t starting_queue_index = 0xffffffff;
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700732
Austin Schuh9942bae2021-01-07 22:06:44 -0800733 // Ending time and queue index.
734 monotonic_clock::time_point ending_monotonic_event_time =
735 monotonic_clock::max_time;
736 uint32_t ending_queue_index = 0xffffffff;
737
738 // The queue index that the first message was *actually* sent with. The
739 // queue indices are assumed to be contiguous through this range.
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700740 uint32_t actual_queue_index = 0xffffffff;
741 };
742
James Kuszmaul94ca5132022-07-19 09:11:08 -0700743 // Returns a list of channels which LogReader will send on but which may
744 // *also* get sent on by other applications in replay.
745 std::vector<
746 std::pair<const aos::Channel *, NodeEventLoopFactory::ExclusiveSenders>>
747 NonExclusiveChannels();
748
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700749 // Stores all the timestamps that have been sent on this channel. This is
750 // only done for channels which are forwarded and on the node which
Austin Schuh9942bae2021-01-07 22:06:44 -0800751 // initially sends the message. Compress using ranges and offsets.
752 std::vector<std::unique_ptr<std::vector<ContiguousSentTimestamp>>>
753 queue_index_map_;
Austin Schuh858c9f32020-08-31 16:56:12 -0700754
755 // Factory (if we are in sim) that this loop was created on.
756 NodeEventLoopFactory *node_event_loop_factory_ = nullptr;
Austin Schuhe33c08d2022-02-03 18:15:21 -0800757 SimulatedEventLoopFactory *event_loop_factory_ = nullptr;
758
James Kuszmaulb11a1502022-07-01 16:02:25 -0700759 // Callback for when this node hits its realtime end time.
760 std::function<void()> notice_realtime_end_;
761
Austin Schuh858c9f32020-08-31 16:56:12 -0700762 std::unique_ptr<EventLoop> event_loop_unique_ptr_;
763 // Event loop.
Austin Schuh58646e22021-08-23 23:51:46 -0700764 const Node *node_ = nullptr;
Austin Schuh858c9f32020-08-31 16:56:12 -0700765 EventLoop *event_loop_ = nullptr;
766 // And timer used to send messages.
Austin Schuh58646e22021-08-23 23:51:46 -0700767 TimerHandler *timer_handler_ = nullptr;
768 TimerHandler *startup_timer_ = nullptr;
Austin Schuh858c9f32020-08-31 16:56:12 -0700769
Austin Schuhe33c08d2022-02-03 18:15:21 -0800770 std::unique_ptr<EventNotifier> start_event_notifier_;
771 std::unique_ptr<EventNotifier> end_event_notifier_;
772
Austin Schuh8bd96322020-02-13 21:18:22 -0800773 // Filters (or nullptr if it isn't a forwarded channel) for each channel.
774 // This corresponds to the object which is shared among all the channels
775 // going between 2 nodes. The second element in the tuple indicates if this
776 // is the primary direction or not.
Austin Schuh2f8fd752020-09-01 22:38:28 -0700777 std::vector<message_bridge::NoncausalOffsetEstimator *> filters_;
James Kuszmaul09632422022-05-25 15:56:19 -0700778 message_bridge::MultiNodeNoncausalOffsetEstimator *multinode_filters_;
Austin Schuh8bd96322020-02-13 21:18:22 -0800779
Austin Schuh84dd1332023-05-03 13:09:47 -0700780 // List of States (or nullptr if it isn't a forwarded channel) which
781 // correspond to the originating node.
Austin Schuh8d7e0bb2020-10-02 17:57:00 -0700782 std::vector<State *> channel_source_state_;
783
Austin Schuh61e973f2021-02-21 21:43:56 -0800784 // This is a cache for channel, connection mapping to the corresponding
785 // sender.
786 absl::btree_map<std::pair<const Channel *, const Connection *>,
787 std::shared_ptr<RemoteMessageSender>>
788 channel_timestamp_loggers_;
789
790 // Mapping from resolved RemoteMessage channel to RemoteMessage sender. This
791 // is the channel that timestamps are published to.
792 absl::btree_map<const Channel *, std::shared_ptr<RemoteMessageSender>>
793 timestamp_loggers_;
Austin Schuh58646e22021-08-23 23:51:46 -0700794
James Kuszmaul09632422022-05-25 15:56:19 -0700795 // Time offset between the log's monotonic clock and the current event
796 // loop's monotonic clock. Useful when replaying logs with non-simulated
797 // event loops.
798 std::chrono::nanoseconds clock_offset_{0};
799
Austin Schuh58646e22021-08-23 23:51:46 -0700800 std::vector<std::function<void()>> on_starts_;
801 std::vector<std::function<void()>> on_ends_;
802
James Kuszmaula16a7912022-06-17 10:58:12 -0700803 std::atomic<bool> stopped_ = false;
804 std::atomic<bool> started_ = false;
Austin Schuhbd5f74a2021-11-11 20:55:38 -0800805
806 bool found_last_message_ = false;
807 std::vector<bool> last_message_;
James Kuszmaula16a7912022-06-17 10:58:12 -0700808
809 std::vector<timing::MessageTimingT> send_timings_;
810 aos::Sender<timing::ReplayTiming> timing_statistics_sender_;
811
812 // Protects access to any internal state after Run() is called. Designed
813 // assuming that only one node is actually executing in replay.
814 // Threading design:
815 // * The worker passed to message_queuer_ has full ownership over all
816 // the log-reading code, timestamp filters, last_queued_message_, etc.
817 // * The main thread should only have exclusive access to the replay
818 // event loop and associated features (mainly senders).
819 // It will pop an item out of the queue (which does maintain a shared_ptr
820 // reference which may also be being used by the message_queuer_ thread,
821 // but having shared_ptr's accessing the same memory from
822 // separate threads is permissible).
823 // Enabling this in simulation is currently infeasible due to a lack of
824 // synchronization in the MultiNodeNoncausalOffsetEstimator. Essentially,
825 // when the message_queuer_ thread attempts to read/pop messages from the
826 // timestamp_mapper_, it will end up calling callbacks that update the
827 // internal state of the MultiNodeNoncausalOffsetEstimator. Simultaneously,
828 // the event scheduler that is running in the main thread to orchestrate the
829 // simulation will be querying the estimator to know what the clocks on the
830 // various nodes are at, leading to potential issues.
831 ThreadedBuffering threading_;
832 std::optional<BootTimestamp> last_queued_message_;
833 std::optional<util::ThreadedQueue<TimestampedMessage, BootTimestamp>>
834 message_queuer_;
Eric Schmiedebergb38477e2022-12-02 16:08:04 -0700835
836 // If a ReplayChannels was passed to LogReader, this will hold the
837 // indices of the channels to replay for the Node represented by
838 // the instance of LogReader::State.
Naman Guptacf6d4422023-03-01 11:41:00 -0800839 std::unique_ptr<const ReplayChannelIndices> replay_channel_indices_;
Austin Schuh6f3babe2020-01-26 20:34:50 -0800840 };
841
Eric Schmiedebergb38477e2022-12-02 16:08:04 -0700842 // If a ReplayChannels was passed to LogReader then creates a
Naman Guptacf6d4422023-03-01 11:41:00 -0800843 // ReplayChannelIndices for the given node. Otherwise, returns a nullptr.
844 std::unique_ptr<const ReplayChannelIndices> MaybeMakeReplayChannelIndices(
Eric Schmiedebergb38477e2022-12-02 16:08:04 -0700845 const Node *node);
846
Austin Schuh8bd96322020-02-13 21:18:22 -0800847 // Node index -> State.
848 std::vector<std::unique_ptr<State>> states_;
849
850 // Creates the requested filter if it doesn't exist, regardless of whether
851 // these nodes can actually communicate directly. The second return value
852 // reports if this is the primary direction or not.
Austin Schuh2f8fd752020-09-01 22:38:28 -0700853 message_bridge::NoncausalOffsetEstimator *GetFilter(const Node *node_a,
854 const Node *node_b);
Austin Schuh8bd96322020-02-13 21:18:22 -0800855
Austin Schuh8bd96322020-02-13 21:18:22 -0800856 // List of filters for a connection. The pointer to the first node will be
857 // less than the second node.
Austin Schuh0ca1fd32020-12-18 22:53:05 -0800858 std::unique_ptr<message_bridge::MultiNodeNoncausalOffsetEstimator> filters_;
Austin Schuh8bd96322020-02-13 21:18:22 -0800859
James Kuszmaul84ff3e52020-01-03 19:48:53 -0800860 std::unique_ptr<FlatbufferDetachedBuffer<Configuration>>
861 remapped_configuration_buffer_;
862
James Kuszmaul84ff3e52020-01-03 19:48:53 -0800863 std::unique_ptr<SimulatedEventLoopFactory> event_loop_factory_unique_ptr_;
864 SimulatedEventLoopFactory *event_loop_factory_ = nullptr;
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800865
866 // Map of channel indices to new name. The channel index will be an index into
867 // logged_configuration(), and the string key will be the name of the channel
868 // to send on instead of the logged channel name.
Austin Schuh0de30f32020-12-06 12:44:28 -0800869 struct RemappedChannel {
870 std::string remapped_name;
871 std::string new_type;
872 };
873 std::map<size_t, RemappedChannel> remapped_channels_;
Austin Schuh01b4c352020-09-21 23:09:39 -0700874 std::vector<MapT> maps_;
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800875
Austin Schuh6f3babe2020-01-26 20:34:50 -0800876 // Number of nodes which still have data to send. This is used to figure out
877 // when to exit.
878 size_t live_nodes_ = 0;
879
James Kuszmaulb11a1502022-07-01 16:02:25 -0700880 // Similar counter to live_nodes_, but for tracking which individual nodes are
881 // running and have yet to hit the realtime end time, if any.
882 size_t live_nodes_with_realtime_time_end_ = 0;
883
James Kuszmaulc7bbb3e2020-01-03 20:01:00 -0800884 const Configuration *remapped_configuration_ = nullptr;
885 const Configuration *replay_configuration_ = nullptr;
Austin Schuhcde938c2020-02-02 17:30:07 -0800886
Eric Schmiedebergb38477e2022-12-02 16:08:04 -0700887 // If a ReplayChannels was passed to LogReader, this will hold the
888 // name and type of channels to replay which is used when creating States.
889 const ReplayChannels *replay_channels_ = nullptr;
890
Austin Schuhcde938c2020-02-02 17:30:07 -0800891 // If true, the replay timer will ignore any missing data. This is used
892 // during startup when we are bootstrapping everything and trying to get to
893 // the start of all the log files.
894 bool ignore_missing_data_ = false;
James Kuszmaul71a81932020-12-15 21:08:01 -0800895
896 // Whether to exit the SimulatedEventLoop when we finish reading the logs.
897 bool exit_on_finish_ = true;
Austin Schuhe33c08d2022-02-03 18:15:21 -0800898
899 realtime_clock::time_point start_time_ = realtime_clock::min_time;
900 realtime_clock::time_point end_time_ = realtime_clock::max_time;
Austin Schuhe309d2a2019-11-29 13:25:21 -0800901};
902
903} // namespace logger
904} // namespace aos
905
Austin Schuhb06f03b2021-02-17 22:00:37 -0800906#endif // AOS_EVENTS_LOGGING_LOG_READER_H_