blob: 0c87e4df5f9b10f2c1036174693888cc6344c66f [file] [log] [blame]
Austin Schuh20b2b082019-09-11 20:42:56 -07001#include "aos/ipc_lib/lockless_queue.h"
2
3#include <linux/futex.h>
4#include <sys/types.h>
5#include <syscall.h>
6#include <unistd.h>
7#include <algorithm>
8#include <iomanip>
9#include <iostream>
10#include <sstream>
11
Austin Schuh20b2b082019-09-11 20:42:56 -070012#include "aos/ipc_lib/lockless_queue_memory.h"
Alex Perrycb7da4b2019-08-28 19:35:56 -070013#include "aos/realtime.h"
Austin Schuh20b2b082019-09-11 20:42:56 -070014#include "aos/util/compiler_memory_barrier.h"
Austin Schuhf257f3c2019-10-27 21:00:43 -070015#include "glog/logging.h"
Austin Schuh20b2b082019-09-11 20:42:56 -070016
17namespace aos {
18namespace ipc_lib {
Austin Schuh20b2b082019-09-11 20:42:56 -070019namespace {
20
Brian Silvermanfafe1fa2019-12-18 21:42:18 -080021class GrabQueueSetupLockOrDie {
22 public:
23 GrabQueueSetupLockOrDie(LocklessQueueMemory *memory) : memory_(memory) {
24 const int result = mutex_grab(&(memory->queue_setup_lock));
25 CHECK(result == 0 || result == 1) << ": " << result;
26 }
Austin Schuh20b2b082019-09-11 20:42:56 -070027
Brian Silvermanfafe1fa2019-12-18 21:42:18 -080028 ~GrabQueueSetupLockOrDie() { mutex_unlock(&(memory_->queue_setup_lock)); }
29
30 GrabQueueSetupLockOrDie(const GrabQueueSetupLockOrDie &) = delete;
31 GrabQueueSetupLockOrDie &operator=(const GrabQueueSetupLockOrDie &) = delete;
32
33 private:
34 LocklessQueueMemory *const memory_;
35};
36
37void Cleanup(LocklessQueueMemory *memory, const GrabQueueSetupLockOrDie &) {
38 // Make sure we start looking at shared memory fresh right now. We'll handle
39 // people dying partway through by either cleaning up after them or not, but
40 // we want to ensure we clean up after anybody who has already died when we
41 // start.
42 aos_compiler_memory_barrier();
43
Austin Schuh20b2b082019-09-11 20:42:56 -070044 const size_t num_senders = memory->num_senders();
45 const size_t queue_size = memory->queue_size();
46 const size_t num_messages = memory->num_messages();
47
48 // There are a large number of crazy cases here for how things can go wrong
49 // and how we have to recover. They either require us to keep extra track of
50 // what is going on, slowing down the send path, or require a large number of
51 // cases.
52 //
53 // The solution here is to not over-think it. This is running while not real
54 // time during construction. It is allowed to be slow. It will also very
55 // rarely trigger. There is a small uS window where process death is
56 // ambiguous.
57 //
58 // So, build up a list N long, where N is the number of messages. Search
59 // through the entire queue and the sender list (ignoring any dead senders),
60 // and mark down which ones we have seen. Once we have seen all the messages
61 // except the N dead senders, we know which messages are dead. Because the
62 // queue is active while we do this, it may take a couple of go arounds to see
63 // everything.
64
65 // Do the easy case. Find all senders who have died. See if they are either
66 // consistent already, or if they have copied over to_replace to the scratch
67 // index, but haven't cleared to_replace. Count them.
68 size_t valid_senders = 0;
69 for (size_t i = 0; i < num_senders; ++i) {
70 Sender *sender = memory->GetSender(i);
71 const uint32_t tid =
Brian Silvermanfafe1fa2019-12-18 21:42:18 -080072 __atomic_load_n(&(sender->tid.futex), __ATOMIC_ACQUIRE);
Austin Schuh20b2b082019-09-11 20:42:56 -070073 if (tid & FUTEX_OWNER_DIED) {
Alex Perrycb7da4b2019-08-28 19:35:56 -070074 VLOG(3) << "Found an easy death for sender " << i;
Brian Silvermanfafe1fa2019-12-18 21:42:18 -080075 // We can do a relaxed load here because we're the only person touching
76 // this sender at this point.
Austin Schuh20b2b082019-09-11 20:42:56 -070077 const Index to_replace = sender->to_replace.RelaxedLoad();
78 const Index scratch_index = sender->scratch_index.Load();
79
80 // I find it easiest to think about this in terms of the set of observable
Brian Silvermanfafe1fa2019-12-18 21:42:18 -080081 // states. The main code progresses through the following states:
Austin Schuh20b2b082019-09-11 20:42:56 -070082
83 // 1) scratch_index = xxx
84 // to_replace = invalid
85 // This is unambiguous. Already good.
86
87 // 2) scratch_index = xxx
88 // to_replace = yyy
89 // Very ambiguous. Is xxx or yyy the correct one? Need to either roll
90 // this forwards or backwards.
91
92 // 3) scratch_index = yyy
93 // to_replace = yyy
94 // We are in the act of moving to_replace to scratch_index, but didn't
95 // finish. Easy.
96
97 // 4) scratch_index = yyy
98 // to_replace = invalid
99 // Finished, but died. Looks like 1)
100
101 // Any cleanup code needs to follow the same set of states to be robust to
102 // death, so death can be restarted.
103
104 // Could be 2) or 3).
105 if (to_replace.valid()) {
106 // 3)
107 if (to_replace == scratch_index) {
108 // Just need to invalidate to_replace to finish.
109 sender->to_replace.Invalidate();
110
111 // And mark that we succeeded.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800112 __atomic_store_n(&(sender->tid.futex), 0, __ATOMIC_RELEASE);
Austin Schuh20b2b082019-09-11 20:42:56 -0700113 ++valid_senders;
114 }
115 } else {
116 // 1) or 4). Make sure we aren't corrupted and declare victory.
117 CHECK(scratch_index.valid());
118
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800119 __atomic_store_n(&(sender->tid.futex), 0, __ATOMIC_RELEASE);
Austin Schuh20b2b082019-09-11 20:42:56 -0700120 ++valid_senders;
121 }
122 } else {
123 // Not dead.
124 ++valid_senders;
125 }
126 }
127
128 // If all the senders are (or were made) good, there is no need to do the hard
129 // case.
130 if (valid_senders == num_senders) {
131 return;
132 }
133
Alex Perrycb7da4b2019-08-28 19:35:56 -0700134 VLOG(3) << "Starting hard cleanup";
Austin Schuh20b2b082019-09-11 20:42:56 -0700135
136 size_t num_accounted_for = 0;
137 size_t num_missing = 0;
138 ::std::vector<bool> accounted_for(num_messages, false);
139
140 while ((num_accounted_for + num_missing) != num_messages) {
141 num_missing = 0;
142 for (size_t i = 0; i < num_senders; ++i) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800143 Sender *const sender = memory->GetSender(i);
Austin Schuh20b2b082019-09-11 20:42:56 -0700144 const uint32_t tid =
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800145 __atomic_load_n(&(sender->tid.futex), __ATOMIC_ACQUIRE);
Austin Schuh20b2b082019-09-11 20:42:56 -0700146 if (tid & FUTEX_OWNER_DIED) {
147 ++num_missing;
148 } else {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800149 // We can do a relaxed load here because we're the only person touching
150 // this sender at this point, if it matters. If it's not a dead sender,
151 // then any message it every has will already be accounted for, so this
152 // will always be a NOP.
Austin Schuh20b2b082019-09-11 20:42:56 -0700153 const Index scratch_index = sender->scratch_index.RelaxedLoad();
154 if (!accounted_for[scratch_index.message_index()]) {
155 ++num_accounted_for;
156 }
157 accounted_for[scratch_index.message_index()] = true;
158 }
159 }
160
161 for (size_t i = 0; i < queue_size; ++i) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800162 // Same logic as above for scratch_index applies here too.
Austin Schuh20b2b082019-09-11 20:42:56 -0700163 const Index index = memory->GetQueue(i)->RelaxedLoad();
164 if (!accounted_for[index.message_index()]) {
165 ++num_accounted_for;
166 }
167 accounted_for[index.message_index()] = true;
168 }
169 }
170
171 while (num_missing != 0) {
172 const size_t starting_num_missing = num_missing;
173 for (size_t i = 0; i < num_senders; ++i) {
174 Sender *sender = memory->GetSender(i);
175 const uint32_t tid =
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800176 __atomic_load_n(&(sender->tid.futex), __ATOMIC_ACQUIRE);
Austin Schuh20b2b082019-09-11 20:42:56 -0700177 if (tid & FUTEX_OWNER_DIED) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800178 // We can do relaxed loads here because we're the only person touching
179 // this sender at this point.
Austin Schuh20b2b082019-09-11 20:42:56 -0700180 const Index scratch_index = sender->scratch_index.RelaxedLoad();
181 const Index to_replace = sender->to_replace.RelaxedLoad();
182
183 // Candidate.
184 CHECK_LE(to_replace.message_index(), accounted_for.size());
185 if (accounted_for[to_replace.message_index()]) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700186 VLOG(3) << "Sender " << i
187 << " died, to_replace is already accounted for";
Austin Schuh20b2b082019-09-11 20:42:56 -0700188 // If both are accounted for, we are corrupt...
189 CHECK(!accounted_for[scratch_index.message_index()]);
190
191 // to_replace is already accounted for. This means that we didn't
192 // atomically insert scratch_index into the queue yet. So
193 // invalidate to_replace.
194 sender->to_replace.Invalidate();
195
196 // And then mark this sender clean.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800197 __atomic_store_n(&(sender->tid.futex), 0, __ATOMIC_RELEASE);
Austin Schuh20b2b082019-09-11 20:42:56 -0700198
199 // And account for scratch_index.
200 accounted_for[scratch_index.message_index()] = true;
201 --num_missing;
202 ++num_accounted_for;
203 } else if (accounted_for[scratch_index.message_index()]) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700204 VLOG(3) << "Sender " << i
205 << " died, scratch_index is already accounted for";
Austin Schuh20b2b082019-09-11 20:42:56 -0700206 // scratch_index is accounted for. That means we did the insert,
207 // but didn't record it.
208 CHECK(to_replace.valid());
209 // Finish the transaction. Copy to_replace, then clear it.
210
211 sender->scratch_index.Store(to_replace);
212 sender->to_replace.Invalidate();
213
214 // And then mark this sender clean.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800215 __atomic_store_n(&(sender->tid.futex), 0, __ATOMIC_RELEASE);
Austin Schuh20b2b082019-09-11 20:42:56 -0700216
217 // And account for to_replace.
218 accounted_for[to_replace.message_index()] = true;
219 --num_missing;
220 ++num_accounted_for;
221 } else {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700222 VLOG(3) << "Sender " << i << " died, neither is accounted for";
Austin Schuh20b2b082019-09-11 20:42:56 -0700223 // Ambiguous. There will be an unambiguous one somewhere that we
224 // can do first.
225 }
226 }
227 }
228 // CHECK that we are making progress.
229 CHECK_NE(num_missing, starting_num_missing);
230 }
231}
232
233// Exposes rt_tgsigqueueinfo so we can send the signal *just* to the target
234// thread.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800235// TODO(Brian): Do directly in assembly for armhf at least for efficiency.
Austin Schuh20b2b082019-09-11 20:42:56 -0700236int rt_tgsigqueueinfo(pid_t tgid, pid_t tid, int sig, siginfo_t *si) {
237 return syscall(SYS_rt_tgsigqueueinfo, tgid, tid, sig, si);
238}
239
240} // namespace
241
242size_t LocklessQueueMemorySize(LocklessQueueConfiguration config) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800243 // Round up the message size so following data is aligned appropriately.
244 config.message_data_size =
245 LocklessQueueMemory::AlignmentRoundUp(config.message_data_size);
Austin Schuh20b2b082019-09-11 20:42:56 -0700246
247 // As we build up the size, confirm that everything is aligned to the
248 // alignment requirements of the type.
249 size_t size = sizeof(LocklessQueueMemory);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800250 CHECK_EQ(size % alignof(LocklessQueueMemory), 0u);
Austin Schuh20b2b082019-09-11 20:42:56 -0700251
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800252 CHECK_EQ(size % alignof(AtomicIndex), 0u);
Austin Schuh20b2b082019-09-11 20:42:56 -0700253 size += LocklessQueueMemory::SizeOfQueue(config);
254
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800255 CHECK_EQ(size % alignof(Message), 0u);
Austin Schuh20b2b082019-09-11 20:42:56 -0700256 size += LocklessQueueMemory::SizeOfMessages(config);
257
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800258 CHECK_EQ(size % alignof(Watcher), 0u);
Austin Schuh20b2b082019-09-11 20:42:56 -0700259 size += LocklessQueueMemory::SizeOfWatchers(config);
260
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800261 CHECK_EQ(size % alignof(Sender), 0u);
Austin Schuh20b2b082019-09-11 20:42:56 -0700262 size += LocklessQueueMemory::SizeOfSenders(config);
263
264 return size;
265}
266
267LocklessQueueMemory *InitializeLocklessQueueMemory(
268 LocklessQueueMemory *memory, LocklessQueueConfiguration config) {
269 // Everything should be zero initialized already. So we just need to fill
270 // everything out properly.
271
272 // Grab the mutex. We don't care if the previous reader died. We are going
273 // to check everything anyways.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800274 GrabQueueSetupLockOrDie grab_queue_setup_lock(memory);
Austin Schuh20b2b082019-09-11 20:42:56 -0700275
276 if (!memory->initialized) {
277 // TODO(austin): Check these for out of bounds.
278 memory->config.num_watchers = config.num_watchers;
279 memory->config.num_senders = config.num_senders;
280 memory->config.queue_size = config.queue_size;
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800281 memory->config.message_data_size =
282 LocklessQueueMemory::AlignmentRoundUp(config.message_data_size);
Austin Schuh20b2b082019-09-11 20:42:56 -0700283
284 const size_t num_messages = memory->num_messages();
285 // There need to be at most MaxMessages() messages allocated.
286 CHECK_LE(num_messages, Index::MaxMessages());
287
288 for (size_t i = 0; i < num_messages; ++i) {
289 memory->GetMessage(Index(QueueIndex::Zero(memory->queue_size()), i))
290 ->header.queue_index.Invalidate();
291 }
292
293 for (size_t i = 0; i < memory->queue_size(); ++i) {
294 // Make the initial counter be the furthest away number. That means that
295 // index 0 should be 0xffff, 1 should be 0, etc.
296 memory->GetQueue(i)->Store(Index(QueueIndex::Zero(memory->queue_size())
297 .IncrementBy(i)
298 .DecrementBy(memory->queue_size()),
299 i));
300 }
301
302 memory->next_queue_index.Invalidate();
303
304 for (size_t i = 0; i < memory->num_senders(); ++i) {
305 ::aos::ipc_lib::Sender *s = memory->GetSender(i);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800306 // Nobody else can possibly be touching these because we haven't set
307 // initialized to true yet.
308 s->scratch_index.RelaxedStore(Index(0xffff, i + memory->queue_size()));
Austin Schuh20b2b082019-09-11 20:42:56 -0700309 s->to_replace.RelaxedInvalidate();
310 }
311
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800312 aos_compiler_memory_barrier();
Austin Schuh20b2b082019-09-11 20:42:56 -0700313 // Signal everything is done. This needs to be done last, so if we die, we
314 // redo initialization.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800315 memory->initialized = true;
Austin Schuh20b2b082019-09-11 20:42:56 -0700316 }
317
Austin Schuh20b2b082019-09-11 20:42:56 -0700318 return memory;
319}
320
321LocklessQueue::LocklessQueue(LocklessQueueMemory *memory,
322 LocklessQueueConfiguration config)
323 : memory_(InitializeLocklessQueueMemory(memory, config)),
324 watcher_copy_(memory_->num_watchers()),
325 pid_(getpid()),
326 uid_(getuid()) {}
327
328LocklessQueue::~LocklessQueue() {
329 CHECK_EQ(watcher_index_, -1);
330
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800331 GrabQueueSetupLockOrDie grab_queue_setup_lock(memory_);
Austin Schuh20b2b082019-09-11 20:42:56 -0700332 const int num_watchers = memory_->num_watchers();
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800333 // Cleanup is cheap. The next user will do it anyways, so no need for us to do
334 // anything right now.
Austin Schuh20b2b082019-09-11 20:42:56 -0700335
336 // And confirm that nothing is owned by us.
337 for (int i = 0; i < num_watchers; ++i) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800338 CHECK(!death_notification_is_held(&(memory_->GetWatcher(i)->tid)));
Austin Schuh20b2b082019-09-11 20:42:56 -0700339 }
Austin Schuh20b2b082019-09-11 20:42:56 -0700340}
341
342size_t LocklessQueue::QueueSize() const { return memory_->queue_size(); }
343
344bool LocklessQueue::RegisterWakeup(int priority) {
345 // TODO(austin): Make sure signal coalescing is turned on. We don't need
346 // duplicates. That will improve performance under high load.
347
348 // Since everything is self consistent, all we need to do is make sure nobody
349 // else is running. Someone dying will get caught in the generic consistency
350 // check.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800351 GrabQueueSetupLockOrDie grab_queue_setup_lock(memory_);
Austin Schuh20b2b082019-09-11 20:42:56 -0700352 const int num_watchers = memory_->num_watchers();
353
354 // Now, find the first empty watcher and grab it.
355 CHECK_EQ(watcher_index_, -1);
356 for (int i = 0; i < num_watchers; ++i) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800357 // If we see a slot the kernel has marked as dead, everything we do reusing
358 // it needs to happen-after whatever that process did before dying.
Brian Silverman2484eea2019-12-21 16:48:46 -0800359 auto *const futex = &(memory_->GetWatcher(i)->tid.futex);
360 const uint32_t tid = __atomic_load_n(futex, __ATOMIC_ACQUIRE);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800361 if (tid == 0 || (tid & FUTEX_OWNER_DIED)) {
Austin Schuh20b2b082019-09-11 20:42:56 -0700362 watcher_index_ = i;
Brian Silverman2484eea2019-12-21 16:48:46 -0800363 // Relaxed is OK here because we're the only task going to touch it
364 // between here and the write in death_notification_init below (other
365 // recovery is blocked by us holding the setup lock).
366 __atomic_store_n(futex, 0, __ATOMIC_RELAXED);
Austin Schuh20b2b082019-09-11 20:42:56 -0700367 break;
368 }
369 }
370
371 // Bail if we failed to find an open slot.
372 if (watcher_index_ == -1) {
Austin Schuh20b2b082019-09-11 20:42:56 -0700373 return false;
374 }
375
376 Watcher *w = memory_->GetWatcher(watcher_index_);
377
378 w->pid = getpid();
379 w->priority = priority;
380
381 // Grabbing a mutex is a compiler and memory barrier, so nothing before will
382 // get rearranged afterwords.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800383 death_notification_init(&(w->tid));
384 return true;
Austin Schuh20b2b082019-09-11 20:42:56 -0700385}
386
387void LocklessQueue::UnregisterWakeup() {
388 // Since everything is self consistent, all we need to do is make sure nobody
389 // else is running. Someone dying will get caught in the generic consistency
390 // check.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800391 GrabQueueSetupLockOrDie grab_queue_setup_lock(memory_);
Austin Schuh20b2b082019-09-11 20:42:56 -0700392
393 // Make sure we are registered.
394 CHECK_NE(watcher_index_, -1);
395
396 // Make sure we still own the slot we are supposed to.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800397 CHECK(
398 death_notification_is_held(&(memory_->GetWatcher(watcher_index_)->tid)));
Austin Schuh20b2b082019-09-11 20:42:56 -0700399
400 // The act of unlocking invalidates the entry. Invalidate it.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800401 death_notification_release(&(memory_->GetWatcher(watcher_index_)->tid));
Austin Schuh20b2b082019-09-11 20:42:56 -0700402 // And internally forget the slot.
403 watcher_index_ = -1;
Austin Schuh20b2b082019-09-11 20:42:56 -0700404}
405
406int LocklessQueue::Wakeup(const int current_priority) {
407 const size_t num_watchers = memory_->num_watchers();
408
409 CHECK_EQ(watcher_copy_.size(), num_watchers);
410
411 // Grab a copy so it won't change out from underneath us, and we can sort it
412 // nicely in C++.
413 // Do note that there is still a window where the process can die *after* we
414 // read everything. We will still PI boost and send a signal to the thread in
415 // question. There is no way without pidfd's to close this window, and
416 // creating a pidfd is likely not RT.
417 for (size_t i = 0; i < num_watchers; ++i) {
418 Watcher *w = memory_->GetWatcher(i);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800419 watcher_copy_[i].tid = __atomic_load_n(&(w->tid.futex), __ATOMIC_RELAXED);
420 // Force the load of the TID to come first.
421 aos_compiler_memory_barrier();
422 watcher_copy_[i].pid = w->pid.load(std::memory_order_relaxed);
423 watcher_copy_[i].priority = w->priority.load(std::memory_order_relaxed);
Austin Schuh20b2b082019-09-11 20:42:56 -0700424
425 // Use a priority of -1 to mean an invalid entry to make sorting easier.
426 if (watcher_copy_[i].tid & FUTEX_OWNER_DIED || watcher_copy_[i].tid == 0) {
427 watcher_copy_[i].priority = -1;
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800428 } else {
429 // Ensure all of this happens after we're done looking at the pid+priority
430 // in shared memory.
431 aos_compiler_memory_barrier();
432 if (watcher_copy_[i].tid != static_cast<pid_t>(__atomic_load_n(
433 &(w->tid.futex), __ATOMIC_RELAXED))) {
434 // Confirm that the watcher hasn't been re-used and modified while we
435 // read it. If it has, mark it invalid again.
436 watcher_copy_[i].priority = -1;
437 watcher_copy_[i].tid = 0;
438 }
Austin Schuh20b2b082019-09-11 20:42:56 -0700439 }
440 }
441
442 // Now sort.
443 ::std::sort(watcher_copy_.begin(), watcher_copy_.end(),
444 [](const WatcherCopy &a, const WatcherCopy &b) {
445 return a.priority > b.priority;
446 });
447
448 int count = 0;
449 if (watcher_copy_[0].priority != -1) {
450 const int max_priority =
451 ::std::max(current_priority, watcher_copy_[0].priority);
452 // Boost if we are RT and there is a higher priority sender out there.
453 // Otherwise we might run into priority inversions.
454 if (max_priority > current_priority && current_priority > 0) {
455 SetCurrentThreadRealtimePriority(max_priority);
456 }
457
458 // Build up the siginfo to send.
459 siginfo_t uinfo;
460 memset(&uinfo, 0, sizeof(uinfo));
461
462 uinfo.si_code = SI_QUEUE;
463 uinfo.si_pid = pid_;
464 uinfo.si_uid = uid_;
465 uinfo.si_value.sival_int = 0;
466
467 for (const WatcherCopy &watcher_copy : watcher_copy_) {
468 // The first -1 priority means we are at the end of the valid list.
469 if (watcher_copy.priority == -1) {
470 break;
471 }
472
473 // Send the signal. Target just the thread that sent it so that we can
474 // support multiple watchers in a process (when someone creates multiple
475 // event loops in different threads).
476 rt_tgsigqueueinfo(watcher_copy.pid, watcher_copy.tid, kWakeupSignal,
477 &uinfo);
478
479 ++count;
480 }
481
482 // Drop back down if we were boosted.
483 if (max_priority > current_priority && current_priority > 0) {
484 SetCurrentThreadRealtimePriority(current_priority);
485 }
486 }
487
488 return count;
489}
490
491LocklessQueue::Sender::Sender(LocklessQueueMemory *memory) : memory_(memory) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800492 GrabQueueSetupLockOrDie grab_queue_setup_lock(memory_);
Austin Schuh20b2b082019-09-11 20:42:56 -0700493
494 // Since we already have the lock, go ahead and try cleaning up.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800495 Cleanup(memory_, grab_queue_setup_lock);
Austin Schuh20b2b082019-09-11 20:42:56 -0700496
497 const int num_senders = memory_->num_senders();
498
499 for (int i = 0; i < num_senders; ++i) {
500 ::aos::ipc_lib::Sender *s = memory->GetSender(i);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800501 // This doesn't need synchronization because we're the only process doing
502 // initialization right now, and nobody else will be touching senders which
503 // we're interested in.
Austin Schuh20b2b082019-09-11 20:42:56 -0700504 const uint32_t tid = __atomic_load_n(&(s->tid.futex), __ATOMIC_RELAXED);
505 if (tid == 0) {
506 sender_index_ = i;
507 break;
508 }
509 }
510
511 if (sender_index_ == -1) {
Austin Schuhf257f3c2019-10-27 21:00:43 -0700512 LOG(FATAL) << "Too many senders";
Austin Schuh20b2b082019-09-11 20:42:56 -0700513 }
514
515 ::aos::ipc_lib::Sender *s = memory_->GetSender(sender_index_);
516
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800517 // Indicate that we are now alive by taking over the slot. If the previous
518 // owner died, we still want to do this.
519 death_notification_init(&(s->tid));
Austin Schuh20b2b082019-09-11 20:42:56 -0700520}
521
522LocklessQueue::Sender::~Sender() {
523 if (memory_ != nullptr) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800524 death_notification_release(&(memory_->GetSender(sender_index_)->tid));
Austin Schuh20b2b082019-09-11 20:42:56 -0700525 }
526}
527
528LocklessQueue::Sender LocklessQueue::MakeSender() {
529 return LocklessQueue::Sender(memory_);
530}
531
532QueueIndex ZeroOrValid(QueueIndex index) {
533 if (!index.valid()) {
534 return index.Clear();
535 }
536 return index;
537}
538
Alex Perrycb7da4b2019-08-28 19:35:56 -0700539size_t LocklessQueue::Sender::size() { return memory_->message_data_size(); }
540
541void *LocklessQueue::Sender::Data() {
542 ::aos::ipc_lib::Sender *sender = memory_->GetSender(sender_index_);
543 Index scratch_index = sender->scratch_index.RelaxedLoad();
544 Message *message = memory_->GetMessage(scratch_index);
545 message->header.queue_index.Invalidate();
546
547 return &message->data[0];
548}
549
Austin Schuh20b2b082019-09-11 20:42:56 -0700550void LocklessQueue::Sender::Send(const char *data, size_t length) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700551 CHECK_LE(length, size());
Austin Schuh67420a42019-12-21 21:55:04 -0800552 // Flatbuffers write from the back of the buffer to the front. If we are
553 // going to write an explicit chunk of memory into the buffer, we need to
554 // adhere to this convention and place it at the end.
555 memcpy((reinterpret_cast<char *>(Data()) + size() - length), data, length);
Alex Perrycb7da4b2019-08-28 19:35:56 -0700556 Send(length);
557}
558
559void LocklessQueue::Sender::Send(size_t length) {
Austin Schuh20b2b082019-09-11 20:42:56 -0700560 const size_t queue_size = memory_->queue_size();
Alex Perrycb7da4b2019-08-28 19:35:56 -0700561 CHECK_LE(length, size());
Austin Schuh20b2b082019-09-11 20:42:56 -0700562
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800563 ::aos::ipc_lib::Sender *const sender = memory_->GetSender(sender_index_);
564 // We can do a relaxed load on our sender because we're the only person
565 // modifying it right now.
566 const Index scratch_index = sender->scratch_index.RelaxedLoad();
567 Message *const message = memory_->GetMessage(scratch_index);
Austin Schuh20b2b082019-09-11 20:42:56 -0700568
Austin Schuh20b2b082019-09-11 20:42:56 -0700569 message->header.length = length;
Austin Schuh20b2b082019-09-11 20:42:56 -0700570
571 while (true) {
572 const QueueIndex actual_next_queue_index =
573 memory_->next_queue_index.Load(queue_size);
574 const QueueIndex next_queue_index = ZeroOrValid(actual_next_queue_index);
575
576 const QueueIndex incremented_queue_index = next_queue_index.Increment();
577
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800578 // This needs to synchronize with whoever the previous writer at this
579 // location was.
Austin Schuh20b2b082019-09-11 20:42:56 -0700580 const Index to_replace = memory_->LoadIndex(next_queue_index);
581
582 const QueueIndex decremented_queue_index =
583 next_queue_index.DecrementBy(queue_size);
584
585 // See if we got beat. If we did, try to atomically update
586 // next_queue_index in case the previous writer failed and retry.
587 if (!to_replace.IsPlausible(decremented_queue_index)) {
588 // We don't care about the result. It will either succeed, or we got
589 // beat in fixing it and just need to give up and try again. If we got
590 // beat multiple times, the only way progress can be made is if the queue
591 // is updated as well. This means that if we retry reading
592 // next_queue_index, we will be at most off by one and can retry.
593 //
594 // Both require no further action from us.
595 //
596 // TODO(austin): If we are having fairness issues under contention, we
597 // could have a mode bit in next_queue_index, and could use a lock or some
598 // other form of PI boosting to let the higher priority task win.
599 memory_->next_queue_index.CompareAndExchangeStrong(
600 actual_next_queue_index, incremented_queue_index);
601
Alex Perrycb7da4b2019-08-28 19:35:56 -0700602 VLOG(3) << "We were beat. Try again. Was " << std::hex
603 << to_replace.get() << ", is " << decremented_queue_index.index();
Austin Schuh20b2b082019-09-11 20:42:56 -0700604 continue;
605 }
606
607 // Confirm that the message is what it should be.
608 {
Austin Schuh20b2b082019-09-11 20:42:56 -0700609 const QueueIndex previous_index =
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800610 memory_->GetMessage(to_replace)->header.queue_index.Load(queue_size);
Austin Schuh20b2b082019-09-11 20:42:56 -0700611 if (previous_index != decremented_queue_index && previous_index.valid()) {
612 // Retry.
Alex Perrycb7da4b2019-08-28 19:35:56 -0700613 VLOG(3) << "Something fishy happened, queue index doesn't match. "
614 "Retrying. Previous index was "
615 << std::hex << previous_index.index() << ", should be "
616 << decremented_queue_index.index();
Austin Schuh20b2b082019-09-11 20:42:56 -0700617 continue;
618 }
619 }
620
621 message->header.monotonic_sent_time = ::aos::monotonic_clock::now();
622 message->header.realtime_sent_time = ::aos::realtime_clock::now();
623
624 // Before we are fully done filling out the message, update the Sender state
625 // with the new index to write. This re-uses the barrier for the
626 // queue_index store.
Alex Perrycb7da4b2019-08-28 19:35:56 -0700627 const Index index_to_write(next_queue_index, scratch_index.message_index());
Austin Schuh20b2b082019-09-11 20:42:56 -0700628
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800629 aos_compiler_memory_barrier();
630 // We're the only person who cares about our scratch index, besides somebody
631 // cleaning up after us.
Austin Schuh20b2b082019-09-11 20:42:56 -0700632 sender->scratch_index.RelaxedStore(index_to_write);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800633 aos_compiler_memory_barrier();
Austin Schuh20b2b082019-09-11 20:42:56 -0700634
635 message->header.queue_index.Store(next_queue_index);
636
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800637 aos_compiler_memory_barrier();
Austin Schuh20b2b082019-09-11 20:42:56 -0700638 // The message is now filled out, and we have a confirmed slot to store
639 // into.
640 //
641 // Start by writing down what we are going to pull out of the queue. This
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800642 // was Invalid before now. Only person who will read this is whoever cleans
643 // up after us, so no synchronization necessary.
Austin Schuh20b2b082019-09-11 20:42:56 -0700644 sender->to_replace.RelaxedStore(to_replace);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800645 aos_compiler_memory_barrier();
Austin Schuh20b2b082019-09-11 20:42:56 -0700646
647 // Then exchange the next index into the queue.
648 if (!memory_->GetQueue(next_queue_index.Wrapped())
649 ->CompareAndExchangeStrong(to_replace, index_to_write)) {
650 // Aw, didn't succeed. Retry.
651 sender->to_replace.RelaxedInvalidate();
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800652 aos_compiler_memory_barrier();
Alex Perrycb7da4b2019-08-28 19:35:56 -0700653 VLOG(3) << "Failed to wrap into queue";
Austin Schuh20b2b082019-09-11 20:42:56 -0700654 continue;
655 }
656
657 // Then update next_queue_index to save the next user some computation time.
658 memory_->next_queue_index.CompareAndExchangeStrong(actual_next_queue_index,
659 incremented_queue_index);
660
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800661 aos_compiler_memory_barrier();
Austin Schuh20b2b082019-09-11 20:42:56 -0700662 // Now update the scratch space and record that we succeeded.
663 sender->scratch_index.Store(to_replace);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800664 aos_compiler_memory_barrier();
665 // And then record that we succeeded, but definitely after the above store.
Austin Schuh20b2b082019-09-11 20:42:56 -0700666 sender->to_replace.RelaxedInvalidate();
667 break;
668 }
669}
670
671LocklessQueue::ReadResult LocklessQueue::Read(
672 uint32_t uint32_queue_index,
673 ::aos::monotonic_clock::time_point *monotonic_sent_time,
674 ::aos::realtime_clock::time_point *realtime_sent_time, size_t *length,
675 char *data) {
676 const size_t queue_size = memory_->queue_size();
677
678 // Build up the QueueIndex.
679 const QueueIndex queue_index =
680 QueueIndex::Zero(queue_size).IncrementBy(uint32_queue_index);
681
682 // Read the message stored at the requested location.
683 Index mi = memory_->LoadIndex(queue_index);
684 Message *m = memory_->GetMessage(mi);
685
686 while (true) {
687 // We need to confirm that the data doesn't change while we are reading it.
688 // Do that by first confirming that the message points to the queue index we
689 // want.
690 const QueueIndex starting_queue_index =
691 m->header.queue_index.Load(queue_size);
692 if (starting_queue_index != queue_index) {
693 // If we found a message that is exactly 1 loop old, we just wrapped.
694 if (starting_queue_index == queue_index.DecrementBy(queue_size)) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700695 VLOG(3) << "Matches: " << std::hex << starting_queue_index.index()
696 << ", " << queue_index.DecrementBy(queue_size).index();
Austin Schuh20b2b082019-09-11 20:42:56 -0700697 return ReadResult::NOTHING_NEW;
698 } else {
699 // Someone has re-used this message between when we pulled it out of the
700 // queue and when we grabbed its index. It is pretty hard to deduce
701 // what happened. Just try again.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800702 Message *const new_m = memory_->GetMessage(queue_index);
Austin Schuh20b2b082019-09-11 20:42:56 -0700703 if (m != new_m) {
704 m = new_m;
Alex Perrycb7da4b2019-08-28 19:35:56 -0700705 VLOG(3) << "Retrying, m doesn't match";
Austin Schuh20b2b082019-09-11 20:42:56 -0700706 continue;
707 }
708
709 // We have confirmed that message still points to the same message. This
710 // means that the message didn't get swapped out from under us, so
711 // starting_queue_index is correct.
712 //
713 // Either we got too far behind (signaled by this being a valid
714 // message), or this is one of the initial messages which are invalid.
715 if (starting_queue_index.valid()) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700716 VLOG(3) << "Too old. Tried for " << std::hex << queue_index.index()
717 << ", got " << starting_queue_index.index() << ", behind by "
718 << std::dec
719 << (starting_queue_index.index() - queue_index.index());
Austin Schuh20b2b082019-09-11 20:42:56 -0700720 return ReadResult::TOO_OLD;
721 }
722
Alex Perrycb7da4b2019-08-28 19:35:56 -0700723 VLOG(3) << "Initial";
Austin Schuh20b2b082019-09-11 20:42:56 -0700724
725 // There isn't a valid message at this location.
726 //
727 // If someone asks for one of the messages within the first go around,
728 // then they need to wait. They got ahead. Otherwise, they are
729 // asking for something crazy, like something before the beginning of
730 // the queue. Tell them that they are behind.
731 if (uint32_queue_index < memory_->queue_size()) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700732 VLOG(3) << "Near zero, " << std::hex << uint32_queue_index;
Austin Schuh20b2b082019-09-11 20:42:56 -0700733 return ReadResult::NOTHING_NEW;
734 } else {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800735 VLOG(3) << "Not near zero, " << std::hex << uint32_queue_index;
Austin Schuh20b2b082019-09-11 20:42:56 -0700736 return ReadResult::TOO_OLD;
737 }
738 }
739 }
Alex Perrycb7da4b2019-08-28 19:35:56 -0700740 VLOG(3) << "Eq: " << std::hex << starting_queue_index.index() << ", "
741 << queue_index.index();
Austin Schuh20b2b082019-09-11 20:42:56 -0700742 break;
743 }
744
Alex Perrycb7da4b2019-08-28 19:35:56 -0700745 // Then read the data out. Copy it all out to be deterministic and so we can
746 // make length be from either end.
Austin Schuh20b2b082019-09-11 20:42:56 -0700747 *monotonic_sent_time = m->header.monotonic_sent_time;
748 *realtime_sent_time = m->header.realtime_sent_time;
Alex Perrycb7da4b2019-08-28 19:35:56 -0700749 memcpy(data, &m->data[0], message_data_size());
Austin Schuh20b2b082019-09-11 20:42:56 -0700750 *length = m->header.length;
751
752 // And finally, confirm that the message *still* points to the queue index we
753 // want. This means it didn't change out from under us.
754 // If something changed out from under us, we were reading it much too late in
755 // it's lifetime.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800756 aos_compiler_memory_barrier();
Austin Schuh20b2b082019-09-11 20:42:56 -0700757 const QueueIndex final_queue_index = m->header.queue_index.Load(queue_size);
758 if (final_queue_index != queue_index) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700759 VLOG(3) << "Changed out from under us. Reading " << std::hex
760 << queue_index.index() << ", finished with "
761 << final_queue_index.index() << ", delta: " << std::dec
762 << (final_queue_index.index() - queue_index.index());
763 return ReadResult::OVERWROTE;
Austin Schuh20b2b082019-09-11 20:42:56 -0700764 }
765
766 return ReadResult::GOOD;
767}
768
Alex Perrycb7da4b2019-08-28 19:35:56 -0700769size_t LocklessQueue::queue_size() const { return memory_->queue_size(); }
770size_t LocklessQueue::message_data_size() const {
771 return memory_->message_data_size();
772}
773
774QueueIndex LocklessQueue::LatestQueueIndex() {
Austin Schuh20b2b082019-09-11 20:42:56 -0700775 const size_t queue_size = memory_->queue_size();
776
777 // There is only one interesting case. We need to know if the queue is empty.
778 // That is done with a sentinel value. At worst, this will be off by one.
779 const QueueIndex next_queue_index =
780 memory_->next_queue_index.Load(queue_size);
781 if (next_queue_index.valid()) {
782 const QueueIndex current_queue_index = next_queue_index.DecrementBy(1u);
Alex Perrycb7da4b2019-08-28 19:35:56 -0700783 return current_queue_index;
Austin Schuh20b2b082019-09-11 20:42:56 -0700784 } else {
785 return empty_queue_index();
786 }
787}
788
789namespace {
790
791// Prints out the mutex state. Not safe to use while the mutex is being
792// changed.
793::std::string PrintMutex(aos_mutex *mutex) {
794 ::std::stringstream s;
795 s << "aos_mutex(" << ::std::hex << mutex->futex;
796
797 if (mutex->futex != 0) {
798 s << ":";
799 if (mutex->futex & FUTEX_OWNER_DIED) {
800 s << "FUTEX_OWNER_DIED|";
801 }
802 s << "tid=" << (mutex->futex & FUTEX_TID_MASK);
803 }
804
805 s << ")";
806 return s.str();
807}
808
809} // namespace
810
811void PrintLocklessQueueMemory(LocklessQueueMemory *memory) {
812 const size_t queue_size = memory->queue_size();
813 ::std::cout << "LocklessQueueMemory (" << memory << ") {" << ::std::endl;
814 ::std::cout << " aos_mutex queue_setup_lock = "
815 << PrintMutex(&memory->queue_setup_lock) << ::std::endl;
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800816 ::std::cout << " bool initialized = " << memory->initialized << ::std::endl;
Austin Schuh20b2b082019-09-11 20:42:56 -0700817 ::std::cout << " config {" << ::std::endl;
818 ::std::cout << " size_t num_watchers = " << memory->config.num_watchers
819 << ::std::endl;
820 ::std::cout << " size_t num_senders = " << memory->config.num_senders
821 << ::std::endl;
822 ::std::cout << " size_t queue_size = " << memory->config.queue_size
823 << ::std::endl;
824 ::std::cout << " size_t message_data_size = "
825 << memory->config.message_data_size << ::std::endl;
826
827 ::std::cout << " AtomicQueueIndex next_queue_index = "
828 << memory->next_queue_index.Load(queue_size).DebugString()
829 << ::std::endl;
830
831 ::std::cout << " }" << ::std::endl;
832 ::std::cout << " AtomicIndex queue[" << queue_size << "] {" << ::std::endl;
833 for (size_t i = 0; i < queue_size; ++i) {
834 ::std::cout << " [" << i << "] -> "
835 << memory->GetQueue(i)->Load().DebugString() << ::std::endl;
836 }
837 ::std::cout << " }" << ::std::endl;
838 ::std::cout << " Message messages[" << memory->num_messages() << "] {"
839 << ::std::endl;
840 for (size_t i = 0; i < memory->num_messages(); ++i) {
841 Message *m = memory->GetMessage(Index(i, i));
842 ::std::cout << " [" << i << "] -> Message {" << ::std::endl;
843 ::std::cout << " Header {" << ::std::endl;
844 ::std::cout << " AtomicQueueIndex queue_index = "
845 << m->header.queue_index.Load(queue_size).DebugString()
846 << ::std::endl;
847 ::std::cout << " size_t length = " << m->header.length
848 << ::std::endl;
849 ::std::cout << " }" << ::std::endl;
850 ::std::cout << " data: {";
851
852 for (size_t j = 0; j < m->header.length; ++j) {
853 char data = m->data[j];
854 if (j != 0) {
855 ::std::cout << " ";
856 }
857 if (::std::isprint(data)) {
858 ::std::cout << ::std::setfill(' ') << ::std::setw(2) << ::std::hex
859 << data;
860 } else {
861 ::std::cout << "0x" << ::std::setfill('0') << ::std::setw(2)
862 << ::std::hex << (static_cast<unsigned>(data) & 0xff);
863 }
864 }
865 ::std::cout << ::std::setfill(' ') << ::std::dec << "}" << ::std::endl;
866 ::std::cout << " }," << ::std::endl;
867 }
868 ::std::cout << " }" << ::std::endl;
869
Alex Perrycb7da4b2019-08-28 19:35:56 -0700870 ::std::cout << " Sender senders[" << memory->num_senders() << "] {"
871 << ::std::endl;
Austin Schuh20b2b082019-09-11 20:42:56 -0700872 for (size_t i = 0; i < memory->num_senders(); ++i) {
873 Sender *s = memory->GetSender(i);
874 ::std::cout << " [" << i << "] -> Sender {" << ::std::endl;
875 ::std::cout << " aos_mutex tid = " << PrintMutex(&s->tid)
876 << ::std::endl;
877 ::std::cout << " AtomicIndex scratch_index = "
878 << s->scratch_index.Load().DebugString() << ::std::endl;
879 ::std::cout << " AtomicIndex to_replace = "
880 << s->to_replace.Load().DebugString() << ::std::endl;
881 ::std::cout << " }" << ::std::endl;
882 }
883 ::std::cout << " }" << ::std::endl;
884
885 ::std::cout << " Watcher watchers[" << memory->num_watchers() << "] {"
886 << ::std::endl;
887 for (size_t i = 0; i < memory->num_watchers(); ++i) {
888 Watcher *w = memory->GetWatcher(i);
889 ::std::cout << " [" << i << "] -> Watcher {" << ::std::endl;
890 ::std::cout << " aos_mutex tid = " << PrintMutex(&w->tid)
891 << ::std::endl;
892 ::std::cout << " pid_t pid = " << w->pid << ::std::endl;
893 ::std::cout << " int priority = " << w->priority << ::std::endl;
894 ::std::cout << " }" << ::std::endl;
895 }
896 ::std::cout << " }" << ::std::endl;
897
898 ::std::cout << "}" << ::std::endl;
899}
900
901} // namespace ipc_lib
902} // namespace aos