blob: 78f990d833dd69a1c40f95f59011bee8238f0594 [file] [log] [blame]
Austin Schuh20b2b082019-09-11 20:42:56 -07001#include "aos/ipc_lib/lockless_queue.h"
2
3#include <linux/futex.h>
4#include <sys/types.h>
5#include <syscall.h>
6#include <unistd.h>
7#include <algorithm>
8#include <iomanip>
9#include <iostream>
10#include <sstream>
11
Austin Schuh20b2b082019-09-11 20:42:56 -070012#include "aos/ipc_lib/lockless_queue_memory.h"
Alex Perrycb7da4b2019-08-28 19:35:56 -070013#include "aos/realtime.h"
Austin Schuh20b2b082019-09-11 20:42:56 -070014#include "aos/util/compiler_memory_barrier.h"
Austin Schuhf257f3c2019-10-27 21:00:43 -070015#include "glog/logging.h"
Austin Schuh20b2b082019-09-11 20:42:56 -070016
17namespace aos {
18namespace ipc_lib {
Austin Schuh20b2b082019-09-11 20:42:56 -070019namespace {
20
Brian Silvermanfafe1fa2019-12-18 21:42:18 -080021class GrabQueueSetupLockOrDie {
22 public:
23 GrabQueueSetupLockOrDie(LocklessQueueMemory *memory) : memory_(memory) {
24 const int result = mutex_grab(&(memory->queue_setup_lock));
25 CHECK(result == 0 || result == 1) << ": " << result;
26 }
Austin Schuh20b2b082019-09-11 20:42:56 -070027
Brian Silvermanfafe1fa2019-12-18 21:42:18 -080028 ~GrabQueueSetupLockOrDie() { mutex_unlock(&(memory_->queue_setup_lock)); }
29
30 GrabQueueSetupLockOrDie(const GrabQueueSetupLockOrDie &) = delete;
31 GrabQueueSetupLockOrDie &operator=(const GrabQueueSetupLockOrDie &) = delete;
32
33 private:
34 LocklessQueueMemory *const memory_;
35};
36
37void Cleanup(LocklessQueueMemory *memory, const GrabQueueSetupLockOrDie &) {
38 // Make sure we start looking at shared memory fresh right now. We'll handle
39 // people dying partway through by either cleaning up after them or not, but
40 // we want to ensure we clean up after anybody who has already died when we
41 // start.
42 aos_compiler_memory_barrier();
43
Austin Schuh20b2b082019-09-11 20:42:56 -070044 const size_t num_senders = memory->num_senders();
45 const size_t queue_size = memory->queue_size();
46 const size_t num_messages = memory->num_messages();
47
48 // There are a large number of crazy cases here for how things can go wrong
49 // and how we have to recover. They either require us to keep extra track of
50 // what is going on, slowing down the send path, or require a large number of
51 // cases.
52 //
53 // The solution here is to not over-think it. This is running while not real
54 // time during construction. It is allowed to be slow. It will also very
55 // rarely trigger. There is a small uS window where process death is
56 // ambiguous.
57 //
58 // So, build up a list N long, where N is the number of messages. Search
59 // through the entire queue and the sender list (ignoring any dead senders),
60 // and mark down which ones we have seen. Once we have seen all the messages
61 // except the N dead senders, we know which messages are dead. Because the
62 // queue is active while we do this, it may take a couple of go arounds to see
63 // everything.
64
65 // Do the easy case. Find all senders who have died. See if they are either
66 // consistent already, or if they have copied over to_replace to the scratch
67 // index, but haven't cleared to_replace. Count them.
68 size_t valid_senders = 0;
69 for (size_t i = 0; i < num_senders; ++i) {
70 Sender *sender = memory->GetSender(i);
71 const uint32_t tid =
Brian Silvermanfafe1fa2019-12-18 21:42:18 -080072 __atomic_load_n(&(sender->tid.futex), __ATOMIC_ACQUIRE);
Austin Schuh20b2b082019-09-11 20:42:56 -070073 if (tid & FUTEX_OWNER_DIED) {
Alex Perrycb7da4b2019-08-28 19:35:56 -070074 VLOG(3) << "Found an easy death for sender " << i;
Brian Silvermanfafe1fa2019-12-18 21:42:18 -080075 // We can do a relaxed load here because we're the only person touching
76 // this sender at this point.
Austin Schuh20b2b082019-09-11 20:42:56 -070077 const Index to_replace = sender->to_replace.RelaxedLoad();
78 const Index scratch_index = sender->scratch_index.Load();
79
80 // I find it easiest to think about this in terms of the set of observable
Brian Silvermanfafe1fa2019-12-18 21:42:18 -080081 // states. The main code progresses through the following states:
Austin Schuh20b2b082019-09-11 20:42:56 -070082
83 // 1) scratch_index = xxx
84 // to_replace = invalid
85 // This is unambiguous. Already good.
86
87 // 2) scratch_index = xxx
88 // to_replace = yyy
89 // Very ambiguous. Is xxx or yyy the correct one? Need to either roll
90 // this forwards or backwards.
91
92 // 3) scratch_index = yyy
93 // to_replace = yyy
94 // We are in the act of moving to_replace to scratch_index, but didn't
95 // finish. Easy.
96
97 // 4) scratch_index = yyy
98 // to_replace = invalid
99 // Finished, but died. Looks like 1)
100
101 // Any cleanup code needs to follow the same set of states to be robust to
102 // death, so death can be restarted.
103
104 // Could be 2) or 3).
105 if (to_replace.valid()) {
106 // 3)
107 if (to_replace == scratch_index) {
108 // Just need to invalidate to_replace to finish.
109 sender->to_replace.Invalidate();
110
111 // And mark that we succeeded.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800112 __atomic_store_n(&(sender->tid.futex), 0, __ATOMIC_RELEASE);
Austin Schuh20b2b082019-09-11 20:42:56 -0700113 ++valid_senders;
114 }
115 } else {
116 // 1) or 4). Make sure we aren't corrupted and declare victory.
117 CHECK(scratch_index.valid());
118
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800119 __atomic_store_n(&(sender->tid.futex), 0, __ATOMIC_RELEASE);
Austin Schuh20b2b082019-09-11 20:42:56 -0700120 ++valid_senders;
121 }
122 } else {
123 // Not dead.
124 ++valid_senders;
125 }
126 }
127
128 // If all the senders are (or were made) good, there is no need to do the hard
129 // case.
130 if (valid_senders == num_senders) {
131 return;
132 }
133
Alex Perrycb7da4b2019-08-28 19:35:56 -0700134 VLOG(3) << "Starting hard cleanup";
Austin Schuh20b2b082019-09-11 20:42:56 -0700135
136 size_t num_accounted_for = 0;
137 size_t num_missing = 0;
138 ::std::vector<bool> accounted_for(num_messages, false);
139
140 while ((num_accounted_for + num_missing) != num_messages) {
141 num_missing = 0;
142 for (size_t i = 0; i < num_senders; ++i) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800143 Sender *const sender = memory->GetSender(i);
Austin Schuh20b2b082019-09-11 20:42:56 -0700144 const uint32_t tid =
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800145 __atomic_load_n(&(sender->tid.futex), __ATOMIC_ACQUIRE);
Austin Schuh20b2b082019-09-11 20:42:56 -0700146 if (tid & FUTEX_OWNER_DIED) {
147 ++num_missing;
148 } else {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800149 // We can do a relaxed load here because we're the only person touching
150 // this sender at this point, if it matters. If it's not a dead sender,
151 // then any message it every has will already be accounted for, so this
152 // will always be a NOP.
Austin Schuh20b2b082019-09-11 20:42:56 -0700153 const Index scratch_index = sender->scratch_index.RelaxedLoad();
154 if (!accounted_for[scratch_index.message_index()]) {
155 ++num_accounted_for;
156 }
157 accounted_for[scratch_index.message_index()] = true;
158 }
159 }
160
161 for (size_t i = 0; i < queue_size; ++i) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800162 // Same logic as above for scratch_index applies here too.
Austin Schuh20b2b082019-09-11 20:42:56 -0700163 const Index index = memory->GetQueue(i)->RelaxedLoad();
164 if (!accounted_for[index.message_index()]) {
165 ++num_accounted_for;
166 }
167 accounted_for[index.message_index()] = true;
168 }
169 }
170
171 while (num_missing != 0) {
172 const size_t starting_num_missing = num_missing;
173 for (size_t i = 0; i < num_senders; ++i) {
174 Sender *sender = memory->GetSender(i);
175 const uint32_t tid =
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800176 __atomic_load_n(&(sender->tid.futex), __ATOMIC_ACQUIRE);
Austin Schuh20b2b082019-09-11 20:42:56 -0700177 if (tid & FUTEX_OWNER_DIED) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800178 // We can do relaxed loads here because we're the only person touching
179 // this sender at this point.
Austin Schuh20b2b082019-09-11 20:42:56 -0700180 const Index scratch_index = sender->scratch_index.RelaxedLoad();
181 const Index to_replace = sender->to_replace.RelaxedLoad();
182
183 // Candidate.
184 CHECK_LE(to_replace.message_index(), accounted_for.size());
185 if (accounted_for[to_replace.message_index()]) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700186 VLOG(3) << "Sender " << i
187 << " died, to_replace is already accounted for";
Austin Schuh20b2b082019-09-11 20:42:56 -0700188 // If both are accounted for, we are corrupt...
189 CHECK(!accounted_for[scratch_index.message_index()]);
190
191 // to_replace is already accounted for. This means that we didn't
192 // atomically insert scratch_index into the queue yet. So
193 // invalidate to_replace.
194 sender->to_replace.Invalidate();
195
196 // And then mark this sender clean.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800197 __atomic_store_n(&(sender->tid.futex), 0, __ATOMIC_RELEASE);
Austin Schuh20b2b082019-09-11 20:42:56 -0700198
199 // And account for scratch_index.
200 accounted_for[scratch_index.message_index()] = true;
201 --num_missing;
202 ++num_accounted_for;
203 } else if (accounted_for[scratch_index.message_index()]) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700204 VLOG(3) << "Sender " << i
205 << " died, scratch_index is already accounted for";
Austin Schuh20b2b082019-09-11 20:42:56 -0700206 // scratch_index is accounted for. That means we did the insert,
207 // but didn't record it.
208 CHECK(to_replace.valid());
209 // Finish the transaction. Copy to_replace, then clear it.
210
211 sender->scratch_index.Store(to_replace);
212 sender->to_replace.Invalidate();
213
214 // And then mark this sender clean.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800215 __atomic_store_n(&(sender->tid.futex), 0, __ATOMIC_RELEASE);
Austin Schuh20b2b082019-09-11 20:42:56 -0700216
217 // And account for to_replace.
218 accounted_for[to_replace.message_index()] = true;
219 --num_missing;
220 ++num_accounted_for;
221 } else {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700222 VLOG(3) << "Sender " << i << " died, neither is accounted for";
Austin Schuh20b2b082019-09-11 20:42:56 -0700223 // Ambiguous. There will be an unambiguous one somewhere that we
224 // can do first.
225 }
226 }
227 }
228 // CHECK that we are making progress.
229 CHECK_NE(num_missing, starting_num_missing);
230 }
231}
232
233// Exposes rt_tgsigqueueinfo so we can send the signal *just* to the target
234// thread.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800235// TODO(Brian): Do directly in assembly for armhf at least for efficiency.
Austin Schuh20b2b082019-09-11 20:42:56 -0700236int rt_tgsigqueueinfo(pid_t tgid, pid_t tid, int sig, siginfo_t *si) {
237 return syscall(SYS_rt_tgsigqueueinfo, tgid, tid, sig, si);
238}
239
240} // namespace
241
242size_t LocklessQueueMemorySize(LocklessQueueConfiguration config) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800243 // Round up the message size so following data is aligned appropriately.
244 config.message_data_size =
245 LocklessQueueMemory::AlignmentRoundUp(config.message_data_size);
Austin Schuh20b2b082019-09-11 20:42:56 -0700246
247 // As we build up the size, confirm that everything is aligned to the
248 // alignment requirements of the type.
249 size_t size = sizeof(LocklessQueueMemory);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800250 CHECK_EQ(size % alignof(LocklessQueueMemory), 0u);
Austin Schuh20b2b082019-09-11 20:42:56 -0700251
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800252 CHECK_EQ(size % alignof(AtomicIndex), 0u);
Austin Schuh20b2b082019-09-11 20:42:56 -0700253 size += LocklessQueueMemory::SizeOfQueue(config);
254
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800255 CHECK_EQ(size % alignof(Message), 0u);
Austin Schuh20b2b082019-09-11 20:42:56 -0700256 size += LocklessQueueMemory::SizeOfMessages(config);
257
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800258 CHECK_EQ(size % alignof(Watcher), 0u);
Austin Schuh20b2b082019-09-11 20:42:56 -0700259 size += LocklessQueueMemory::SizeOfWatchers(config);
260
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800261 CHECK_EQ(size % alignof(Sender), 0u);
Austin Schuh20b2b082019-09-11 20:42:56 -0700262 size += LocklessQueueMemory::SizeOfSenders(config);
263
264 return size;
265}
266
267LocklessQueueMemory *InitializeLocklessQueueMemory(
268 LocklessQueueMemory *memory, LocklessQueueConfiguration config) {
269 // Everything should be zero initialized already. So we just need to fill
270 // everything out properly.
271
272 // Grab the mutex. We don't care if the previous reader died. We are going
273 // to check everything anyways.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800274 GrabQueueSetupLockOrDie grab_queue_setup_lock(memory);
Austin Schuh20b2b082019-09-11 20:42:56 -0700275
276 if (!memory->initialized) {
277 // TODO(austin): Check these for out of bounds.
278 memory->config.num_watchers = config.num_watchers;
279 memory->config.num_senders = config.num_senders;
280 memory->config.queue_size = config.queue_size;
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800281 memory->config.message_data_size =
282 LocklessQueueMemory::AlignmentRoundUp(config.message_data_size);
Austin Schuh20b2b082019-09-11 20:42:56 -0700283
284 const size_t num_messages = memory->num_messages();
285 // There need to be at most MaxMessages() messages allocated.
286 CHECK_LE(num_messages, Index::MaxMessages());
287
288 for (size_t i = 0; i < num_messages; ++i) {
289 memory->GetMessage(Index(QueueIndex::Zero(memory->queue_size()), i))
290 ->header.queue_index.Invalidate();
291 }
292
293 for (size_t i = 0; i < memory->queue_size(); ++i) {
294 // Make the initial counter be the furthest away number. That means that
295 // index 0 should be 0xffff, 1 should be 0, etc.
296 memory->GetQueue(i)->Store(Index(QueueIndex::Zero(memory->queue_size())
297 .IncrementBy(i)
298 .DecrementBy(memory->queue_size()),
299 i));
300 }
301
302 memory->next_queue_index.Invalidate();
303
304 for (size_t i = 0; i < memory->num_senders(); ++i) {
305 ::aos::ipc_lib::Sender *s = memory->GetSender(i);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800306 // Nobody else can possibly be touching these because we haven't set
307 // initialized to true yet.
308 s->scratch_index.RelaxedStore(Index(0xffff, i + memory->queue_size()));
Austin Schuh20b2b082019-09-11 20:42:56 -0700309 s->to_replace.RelaxedInvalidate();
310 }
311
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800312 aos_compiler_memory_barrier();
Austin Schuh20b2b082019-09-11 20:42:56 -0700313 // Signal everything is done. This needs to be done last, so if we die, we
314 // redo initialization.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800315 memory->initialized = true;
Austin Schuh20b2b082019-09-11 20:42:56 -0700316 }
317
Austin Schuh20b2b082019-09-11 20:42:56 -0700318 return memory;
319}
320
321LocklessQueue::LocklessQueue(LocklessQueueMemory *memory,
322 LocklessQueueConfiguration config)
323 : memory_(InitializeLocklessQueueMemory(memory, config)),
324 watcher_copy_(memory_->num_watchers()),
325 pid_(getpid()),
326 uid_(getuid()) {}
327
328LocklessQueue::~LocklessQueue() {
329 CHECK_EQ(watcher_index_, -1);
330
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800331 GrabQueueSetupLockOrDie grab_queue_setup_lock(memory_);
Austin Schuh20b2b082019-09-11 20:42:56 -0700332 const int num_watchers = memory_->num_watchers();
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800333 // Cleanup is cheap. The next user will do it anyways, so no need for us to do
334 // anything right now.
Austin Schuh20b2b082019-09-11 20:42:56 -0700335
336 // And confirm that nothing is owned by us.
337 for (int i = 0; i < num_watchers; ++i) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800338 CHECK(!death_notification_is_held(&(memory_->GetWatcher(i)->tid)));
Austin Schuh20b2b082019-09-11 20:42:56 -0700339 }
Austin Schuh20b2b082019-09-11 20:42:56 -0700340}
341
342size_t LocklessQueue::QueueSize() const { return memory_->queue_size(); }
343
344bool LocklessQueue::RegisterWakeup(int priority) {
345 // TODO(austin): Make sure signal coalescing is turned on. We don't need
346 // duplicates. That will improve performance under high load.
347
348 // Since everything is self consistent, all we need to do is make sure nobody
349 // else is running. Someone dying will get caught in the generic consistency
350 // check.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800351 GrabQueueSetupLockOrDie grab_queue_setup_lock(memory_);
Austin Schuh20b2b082019-09-11 20:42:56 -0700352 const int num_watchers = memory_->num_watchers();
353
354 // Now, find the first empty watcher and grab it.
355 CHECK_EQ(watcher_index_, -1);
356 for (int i = 0; i < num_watchers; ++i) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800357 // If we see a slot the kernel has marked as dead, everything we do reusing
358 // it needs to happen-after whatever that process did before dying.
Austin Schuh20b2b082019-09-11 20:42:56 -0700359 const uint32_t tid =
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800360 __atomic_load_n(&(memory_->GetWatcher(i)->tid.futex), __ATOMIC_ACQUIRE);
361 if (tid == 0 || (tid & FUTEX_OWNER_DIED)) {
Austin Schuh20b2b082019-09-11 20:42:56 -0700362 watcher_index_ = i;
363 break;
364 }
365 }
366
367 // Bail if we failed to find an open slot.
368 if (watcher_index_ == -1) {
Austin Schuh20b2b082019-09-11 20:42:56 -0700369 return false;
370 }
371
372 Watcher *w = memory_->GetWatcher(watcher_index_);
373
374 w->pid = getpid();
375 w->priority = priority;
376
377 // Grabbing a mutex is a compiler and memory barrier, so nothing before will
378 // get rearranged afterwords.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800379 death_notification_init(&(w->tid));
380 return true;
Austin Schuh20b2b082019-09-11 20:42:56 -0700381}
382
383void LocklessQueue::UnregisterWakeup() {
384 // Since everything is self consistent, all we need to do is make sure nobody
385 // else is running. Someone dying will get caught in the generic consistency
386 // check.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800387 GrabQueueSetupLockOrDie grab_queue_setup_lock(memory_);
Austin Schuh20b2b082019-09-11 20:42:56 -0700388
389 // Make sure we are registered.
390 CHECK_NE(watcher_index_, -1);
391
392 // Make sure we still own the slot we are supposed to.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800393 CHECK(
394 death_notification_is_held(&(memory_->GetWatcher(watcher_index_)->tid)));
Austin Schuh20b2b082019-09-11 20:42:56 -0700395
396 // The act of unlocking invalidates the entry. Invalidate it.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800397 death_notification_release(&(memory_->GetWatcher(watcher_index_)->tid));
Austin Schuh20b2b082019-09-11 20:42:56 -0700398 // And internally forget the slot.
399 watcher_index_ = -1;
Austin Schuh20b2b082019-09-11 20:42:56 -0700400}
401
402int LocklessQueue::Wakeup(const int current_priority) {
403 const size_t num_watchers = memory_->num_watchers();
404
405 CHECK_EQ(watcher_copy_.size(), num_watchers);
406
407 // Grab a copy so it won't change out from underneath us, and we can sort it
408 // nicely in C++.
409 // Do note that there is still a window where the process can die *after* we
410 // read everything. We will still PI boost and send a signal to the thread in
411 // question. There is no way without pidfd's to close this window, and
412 // creating a pidfd is likely not RT.
413 for (size_t i = 0; i < num_watchers; ++i) {
414 Watcher *w = memory_->GetWatcher(i);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800415 watcher_copy_[i].tid = __atomic_load_n(&(w->tid.futex), __ATOMIC_RELAXED);
416 // Force the load of the TID to come first.
417 aos_compiler_memory_barrier();
418 watcher_copy_[i].pid = w->pid.load(std::memory_order_relaxed);
419 watcher_copy_[i].priority = w->priority.load(std::memory_order_relaxed);
Austin Schuh20b2b082019-09-11 20:42:56 -0700420
421 // Use a priority of -1 to mean an invalid entry to make sorting easier.
422 if (watcher_copy_[i].tid & FUTEX_OWNER_DIED || watcher_copy_[i].tid == 0) {
423 watcher_copy_[i].priority = -1;
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800424 } else {
425 // Ensure all of this happens after we're done looking at the pid+priority
426 // in shared memory.
427 aos_compiler_memory_barrier();
428 if (watcher_copy_[i].tid != static_cast<pid_t>(__atomic_load_n(
429 &(w->tid.futex), __ATOMIC_RELAXED))) {
430 // Confirm that the watcher hasn't been re-used and modified while we
431 // read it. If it has, mark it invalid again.
432 watcher_copy_[i].priority = -1;
433 watcher_copy_[i].tid = 0;
434 }
Austin Schuh20b2b082019-09-11 20:42:56 -0700435 }
436 }
437
438 // Now sort.
439 ::std::sort(watcher_copy_.begin(), watcher_copy_.end(),
440 [](const WatcherCopy &a, const WatcherCopy &b) {
441 return a.priority > b.priority;
442 });
443
444 int count = 0;
445 if (watcher_copy_[0].priority != -1) {
446 const int max_priority =
447 ::std::max(current_priority, watcher_copy_[0].priority);
448 // Boost if we are RT and there is a higher priority sender out there.
449 // Otherwise we might run into priority inversions.
450 if (max_priority > current_priority && current_priority > 0) {
451 SetCurrentThreadRealtimePriority(max_priority);
452 }
453
454 // Build up the siginfo to send.
455 siginfo_t uinfo;
456 memset(&uinfo, 0, sizeof(uinfo));
457
458 uinfo.si_code = SI_QUEUE;
459 uinfo.si_pid = pid_;
460 uinfo.si_uid = uid_;
461 uinfo.si_value.sival_int = 0;
462
463 for (const WatcherCopy &watcher_copy : watcher_copy_) {
464 // The first -1 priority means we are at the end of the valid list.
465 if (watcher_copy.priority == -1) {
466 break;
467 }
468
469 // Send the signal. Target just the thread that sent it so that we can
470 // support multiple watchers in a process (when someone creates multiple
471 // event loops in different threads).
472 rt_tgsigqueueinfo(watcher_copy.pid, watcher_copy.tid, kWakeupSignal,
473 &uinfo);
474
475 ++count;
476 }
477
478 // Drop back down if we were boosted.
479 if (max_priority > current_priority && current_priority > 0) {
480 SetCurrentThreadRealtimePriority(current_priority);
481 }
482 }
483
484 return count;
485}
486
487LocklessQueue::Sender::Sender(LocklessQueueMemory *memory) : memory_(memory) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800488 GrabQueueSetupLockOrDie grab_queue_setup_lock(memory_);
Austin Schuh20b2b082019-09-11 20:42:56 -0700489
490 // Since we already have the lock, go ahead and try cleaning up.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800491 Cleanup(memory_, grab_queue_setup_lock);
Austin Schuh20b2b082019-09-11 20:42:56 -0700492
493 const int num_senders = memory_->num_senders();
494
495 for (int i = 0; i < num_senders; ++i) {
496 ::aos::ipc_lib::Sender *s = memory->GetSender(i);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800497 // This doesn't need synchronization because we're the only process doing
498 // initialization right now, and nobody else will be touching senders which
499 // we're interested in.
Austin Schuh20b2b082019-09-11 20:42:56 -0700500 const uint32_t tid = __atomic_load_n(&(s->tid.futex), __ATOMIC_RELAXED);
501 if (tid == 0) {
502 sender_index_ = i;
503 break;
504 }
505 }
506
507 if (sender_index_ == -1) {
Austin Schuhf257f3c2019-10-27 21:00:43 -0700508 LOG(FATAL) << "Too many senders";
Austin Schuh20b2b082019-09-11 20:42:56 -0700509 }
510
511 ::aos::ipc_lib::Sender *s = memory_->GetSender(sender_index_);
512
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800513 // Indicate that we are now alive by taking over the slot. If the previous
514 // owner died, we still want to do this.
515 death_notification_init(&(s->tid));
Austin Schuh20b2b082019-09-11 20:42:56 -0700516}
517
518LocklessQueue::Sender::~Sender() {
519 if (memory_ != nullptr) {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800520 death_notification_release(&(memory_->GetSender(sender_index_)->tid));
Austin Schuh20b2b082019-09-11 20:42:56 -0700521 }
522}
523
524LocklessQueue::Sender LocklessQueue::MakeSender() {
525 return LocklessQueue::Sender(memory_);
526}
527
528QueueIndex ZeroOrValid(QueueIndex index) {
529 if (!index.valid()) {
530 return index.Clear();
531 }
532 return index;
533}
534
Alex Perrycb7da4b2019-08-28 19:35:56 -0700535size_t LocklessQueue::Sender::size() { return memory_->message_data_size(); }
536
537void *LocklessQueue::Sender::Data() {
538 ::aos::ipc_lib::Sender *sender = memory_->GetSender(sender_index_);
539 Index scratch_index = sender->scratch_index.RelaxedLoad();
540 Message *message = memory_->GetMessage(scratch_index);
541 message->header.queue_index.Invalidate();
542
543 return &message->data[0];
544}
545
Austin Schuh20b2b082019-09-11 20:42:56 -0700546void LocklessQueue::Sender::Send(const char *data, size_t length) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700547 CHECK_LE(length, size());
548 memcpy(Data(), data, length);
549 Send(length);
550}
551
552void LocklessQueue::Sender::Send(size_t length) {
Austin Schuh20b2b082019-09-11 20:42:56 -0700553 const size_t queue_size = memory_->queue_size();
Alex Perrycb7da4b2019-08-28 19:35:56 -0700554 CHECK_LE(length, size());
Austin Schuh20b2b082019-09-11 20:42:56 -0700555
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800556 ::aos::ipc_lib::Sender *const sender = memory_->GetSender(sender_index_);
557 // We can do a relaxed load on our sender because we're the only person
558 // modifying it right now.
559 const Index scratch_index = sender->scratch_index.RelaxedLoad();
560 Message *const message = memory_->GetMessage(scratch_index);
Austin Schuh20b2b082019-09-11 20:42:56 -0700561
Austin Schuh20b2b082019-09-11 20:42:56 -0700562 message->header.length = length;
Austin Schuh20b2b082019-09-11 20:42:56 -0700563
564 while (true) {
565 const QueueIndex actual_next_queue_index =
566 memory_->next_queue_index.Load(queue_size);
567 const QueueIndex next_queue_index = ZeroOrValid(actual_next_queue_index);
568
569 const QueueIndex incremented_queue_index = next_queue_index.Increment();
570
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800571 // This needs to synchronize with whoever the previous writer at this
572 // location was.
Austin Schuh20b2b082019-09-11 20:42:56 -0700573 const Index to_replace = memory_->LoadIndex(next_queue_index);
574
575 const QueueIndex decremented_queue_index =
576 next_queue_index.DecrementBy(queue_size);
577
578 // See if we got beat. If we did, try to atomically update
579 // next_queue_index in case the previous writer failed and retry.
580 if (!to_replace.IsPlausible(decremented_queue_index)) {
581 // We don't care about the result. It will either succeed, or we got
582 // beat in fixing it and just need to give up and try again. If we got
583 // beat multiple times, the only way progress can be made is if the queue
584 // is updated as well. This means that if we retry reading
585 // next_queue_index, we will be at most off by one and can retry.
586 //
587 // Both require no further action from us.
588 //
589 // TODO(austin): If we are having fairness issues under contention, we
590 // could have a mode bit in next_queue_index, and could use a lock or some
591 // other form of PI boosting to let the higher priority task win.
592 memory_->next_queue_index.CompareAndExchangeStrong(
593 actual_next_queue_index, incremented_queue_index);
594
Alex Perrycb7da4b2019-08-28 19:35:56 -0700595 VLOG(3) << "We were beat. Try again. Was " << std::hex
596 << to_replace.get() << ", is " << decremented_queue_index.index();
Austin Schuh20b2b082019-09-11 20:42:56 -0700597 continue;
598 }
599
600 // Confirm that the message is what it should be.
601 {
Austin Schuh20b2b082019-09-11 20:42:56 -0700602 const QueueIndex previous_index =
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800603 memory_->GetMessage(to_replace)->header.queue_index.Load(queue_size);
Austin Schuh20b2b082019-09-11 20:42:56 -0700604 if (previous_index != decremented_queue_index && previous_index.valid()) {
605 // Retry.
Alex Perrycb7da4b2019-08-28 19:35:56 -0700606 VLOG(3) << "Something fishy happened, queue index doesn't match. "
607 "Retrying. Previous index was "
608 << std::hex << previous_index.index() << ", should be "
609 << decremented_queue_index.index();
Austin Schuh20b2b082019-09-11 20:42:56 -0700610 continue;
611 }
612 }
613
614 message->header.monotonic_sent_time = ::aos::monotonic_clock::now();
615 message->header.realtime_sent_time = ::aos::realtime_clock::now();
616
617 // Before we are fully done filling out the message, update the Sender state
618 // with the new index to write. This re-uses the barrier for the
619 // queue_index store.
Alex Perrycb7da4b2019-08-28 19:35:56 -0700620 const Index index_to_write(next_queue_index, scratch_index.message_index());
Austin Schuh20b2b082019-09-11 20:42:56 -0700621
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800622 aos_compiler_memory_barrier();
623 // We're the only person who cares about our scratch index, besides somebody
624 // cleaning up after us.
Austin Schuh20b2b082019-09-11 20:42:56 -0700625 sender->scratch_index.RelaxedStore(index_to_write);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800626 aos_compiler_memory_barrier();
Austin Schuh20b2b082019-09-11 20:42:56 -0700627
628 message->header.queue_index.Store(next_queue_index);
629
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800630 aos_compiler_memory_barrier();
Austin Schuh20b2b082019-09-11 20:42:56 -0700631 // The message is now filled out, and we have a confirmed slot to store
632 // into.
633 //
634 // Start by writing down what we are going to pull out of the queue. This
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800635 // was Invalid before now. Only person who will read this is whoever cleans
636 // up after us, so no synchronization necessary.
Austin Schuh20b2b082019-09-11 20:42:56 -0700637 sender->to_replace.RelaxedStore(to_replace);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800638 aos_compiler_memory_barrier();
Austin Schuh20b2b082019-09-11 20:42:56 -0700639
640 // Then exchange the next index into the queue.
641 if (!memory_->GetQueue(next_queue_index.Wrapped())
642 ->CompareAndExchangeStrong(to_replace, index_to_write)) {
643 // Aw, didn't succeed. Retry.
644 sender->to_replace.RelaxedInvalidate();
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800645 aos_compiler_memory_barrier();
Alex Perrycb7da4b2019-08-28 19:35:56 -0700646 VLOG(3) << "Failed to wrap into queue";
Austin Schuh20b2b082019-09-11 20:42:56 -0700647 continue;
648 }
649
650 // Then update next_queue_index to save the next user some computation time.
651 memory_->next_queue_index.CompareAndExchangeStrong(actual_next_queue_index,
652 incremented_queue_index);
653
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800654 aos_compiler_memory_barrier();
Austin Schuh20b2b082019-09-11 20:42:56 -0700655 // Now update the scratch space and record that we succeeded.
656 sender->scratch_index.Store(to_replace);
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800657 aos_compiler_memory_barrier();
658 // And then record that we succeeded, but definitely after the above store.
Austin Schuh20b2b082019-09-11 20:42:56 -0700659 sender->to_replace.RelaxedInvalidate();
660 break;
661 }
662}
663
664LocklessQueue::ReadResult LocklessQueue::Read(
665 uint32_t uint32_queue_index,
666 ::aos::monotonic_clock::time_point *monotonic_sent_time,
667 ::aos::realtime_clock::time_point *realtime_sent_time, size_t *length,
668 char *data) {
669 const size_t queue_size = memory_->queue_size();
670
671 // Build up the QueueIndex.
672 const QueueIndex queue_index =
673 QueueIndex::Zero(queue_size).IncrementBy(uint32_queue_index);
674
675 // Read the message stored at the requested location.
676 Index mi = memory_->LoadIndex(queue_index);
677 Message *m = memory_->GetMessage(mi);
678
679 while (true) {
680 // We need to confirm that the data doesn't change while we are reading it.
681 // Do that by first confirming that the message points to the queue index we
682 // want.
683 const QueueIndex starting_queue_index =
684 m->header.queue_index.Load(queue_size);
685 if (starting_queue_index != queue_index) {
686 // If we found a message that is exactly 1 loop old, we just wrapped.
687 if (starting_queue_index == queue_index.DecrementBy(queue_size)) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700688 VLOG(3) << "Matches: " << std::hex << starting_queue_index.index()
689 << ", " << queue_index.DecrementBy(queue_size).index();
Austin Schuh20b2b082019-09-11 20:42:56 -0700690 return ReadResult::NOTHING_NEW;
691 } else {
692 // Someone has re-used this message between when we pulled it out of the
693 // queue and when we grabbed its index. It is pretty hard to deduce
694 // what happened. Just try again.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800695 Message *const new_m = memory_->GetMessage(queue_index);
Austin Schuh20b2b082019-09-11 20:42:56 -0700696 if (m != new_m) {
697 m = new_m;
Alex Perrycb7da4b2019-08-28 19:35:56 -0700698 VLOG(3) << "Retrying, m doesn't match";
Austin Schuh20b2b082019-09-11 20:42:56 -0700699 continue;
700 }
701
702 // We have confirmed that message still points to the same message. This
703 // means that the message didn't get swapped out from under us, so
704 // starting_queue_index is correct.
705 //
706 // Either we got too far behind (signaled by this being a valid
707 // message), or this is one of the initial messages which are invalid.
708 if (starting_queue_index.valid()) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700709 VLOG(3) << "Too old. Tried for " << std::hex << queue_index.index()
710 << ", got " << starting_queue_index.index() << ", behind by "
711 << std::dec
712 << (starting_queue_index.index() - queue_index.index());
Austin Schuh20b2b082019-09-11 20:42:56 -0700713 return ReadResult::TOO_OLD;
714 }
715
Alex Perrycb7da4b2019-08-28 19:35:56 -0700716 VLOG(3) << "Initial";
Austin Schuh20b2b082019-09-11 20:42:56 -0700717
718 // There isn't a valid message at this location.
719 //
720 // If someone asks for one of the messages within the first go around,
721 // then they need to wait. They got ahead. Otherwise, they are
722 // asking for something crazy, like something before the beginning of
723 // the queue. Tell them that they are behind.
724 if (uint32_queue_index < memory_->queue_size()) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700725 VLOG(3) << "Near zero, " << std::hex << uint32_queue_index;
Austin Schuh20b2b082019-09-11 20:42:56 -0700726 return ReadResult::NOTHING_NEW;
727 } else {
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800728 VLOG(3) << "Not near zero, " << std::hex << uint32_queue_index;
Austin Schuh20b2b082019-09-11 20:42:56 -0700729 return ReadResult::TOO_OLD;
730 }
731 }
732 }
Alex Perrycb7da4b2019-08-28 19:35:56 -0700733 VLOG(3) << "Eq: " << std::hex << starting_queue_index.index() << ", "
734 << queue_index.index();
Austin Schuh20b2b082019-09-11 20:42:56 -0700735 break;
736 }
737
Alex Perrycb7da4b2019-08-28 19:35:56 -0700738 // Then read the data out. Copy it all out to be deterministic and so we can
739 // make length be from either end.
Austin Schuh20b2b082019-09-11 20:42:56 -0700740 *monotonic_sent_time = m->header.monotonic_sent_time;
741 *realtime_sent_time = m->header.realtime_sent_time;
Alex Perrycb7da4b2019-08-28 19:35:56 -0700742 memcpy(data, &m->data[0], message_data_size());
Austin Schuh20b2b082019-09-11 20:42:56 -0700743 *length = m->header.length;
744
745 // And finally, confirm that the message *still* points to the queue index we
746 // want. This means it didn't change out from under us.
747 // If something changed out from under us, we were reading it much too late in
748 // it's lifetime.
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800749 aos_compiler_memory_barrier();
Austin Schuh20b2b082019-09-11 20:42:56 -0700750 const QueueIndex final_queue_index = m->header.queue_index.Load(queue_size);
751 if (final_queue_index != queue_index) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700752 VLOG(3) << "Changed out from under us. Reading " << std::hex
753 << queue_index.index() << ", finished with "
754 << final_queue_index.index() << ", delta: " << std::dec
755 << (final_queue_index.index() - queue_index.index());
756 return ReadResult::OVERWROTE;
Austin Schuh20b2b082019-09-11 20:42:56 -0700757 }
758
759 return ReadResult::GOOD;
760}
761
Alex Perrycb7da4b2019-08-28 19:35:56 -0700762size_t LocklessQueue::queue_size() const { return memory_->queue_size(); }
763size_t LocklessQueue::message_data_size() const {
764 return memory_->message_data_size();
765}
766
767QueueIndex LocklessQueue::LatestQueueIndex() {
Austin Schuh20b2b082019-09-11 20:42:56 -0700768 const size_t queue_size = memory_->queue_size();
769
770 // There is only one interesting case. We need to know if the queue is empty.
771 // That is done with a sentinel value. At worst, this will be off by one.
772 const QueueIndex next_queue_index =
773 memory_->next_queue_index.Load(queue_size);
774 if (next_queue_index.valid()) {
775 const QueueIndex current_queue_index = next_queue_index.DecrementBy(1u);
Alex Perrycb7da4b2019-08-28 19:35:56 -0700776 return current_queue_index;
Austin Schuh20b2b082019-09-11 20:42:56 -0700777 } else {
778 return empty_queue_index();
779 }
780}
781
782namespace {
783
784// Prints out the mutex state. Not safe to use while the mutex is being
785// changed.
786::std::string PrintMutex(aos_mutex *mutex) {
787 ::std::stringstream s;
788 s << "aos_mutex(" << ::std::hex << mutex->futex;
789
790 if (mutex->futex != 0) {
791 s << ":";
792 if (mutex->futex & FUTEX_OWNER_DIED) {
793 s << "FUTEX_OWNER_DIED|";
794 }
795 s << "tid=" << (mutex->futex & FUTEX_TID_MASK);
796 }
797
798 s << ")";
799 return s.str();
800}
801
802} // namespace
803
804void PrintLocklessQueueMemory(LocklessQueueMemory *memory) {
805 const size_t queue_size = memory->queue_size();
806 ::std::cout << "LocklessQueueMemory (" << memory << ") {" << ::std::endl;
807 ::std::cout << " aos_mutex queue_setup_lock = "
808 << PrintMutex(&memory->queue_setup_lock) << ::std::endl;
Brian Silvermanfafe1fa2019-12-18 21:42:18 -0800809 ::std::cout << " bool initialized = " << memory->initialized << ::std::endl;
Austin Schuh20b2b082019-09-11 20:42:56 -0700810 ::std::cout << " config {" << ::std::endl;
811 ::std::cout << " size_t num_watchers = " << memory->config.num_watchers
812 << ::std::endl;
813 ::std::cout << " size_t num_senders = " << memory->config.num_senders
814 << ::std::endl;
815 ::std::cout << " size_t queue_size = " << memory->config.queue_size
816 << ::std::endl;
817 ::std::cout << " size_t message_data_size = "
818 << memory->config.message_data_size << ::std::endl;
819
820 ::std::cout << " AtomicQueueIndex next_queue_index = "
821 << memory->next_queue_index.Load(queue_size).DebugString()
822 << ::std::endl;
823
824 ::std::cout << " }" << ::std::endl;
825 ::std::cout << " AtomicIndex queue[" << queue_size << "] {" << ::std::endl;
826 for (size_t i = 0; i < queue_size; ++i) {
827 ::std::cout << " [" << i << "] -> "
828 << memory->GetQueue(i)->Load().DebugString() << ::std::endl;
829 }
830 ::std::cout << " }" << ::std::endl;
831 ::std::cout << " Message messages[" << memory->num_messages() << "] {"
832 << ::std::endl;
833 for (size_t i = 0; i < memory->num_messages(); ++i) {
834 Message *m = memory->GetMessage(Index(i, i));
835 ::std::cout << " [" << i << "] -> Message {" << ::std::endl;
836 ::std::cout << " Header {" << ::std::endl;
837 ::std::cout << " AtomicQueueIndex queue_index = "
838 << m->header.queue_index.Load(queue_size).DebugString()
839 << ::std::endl;
840 ::std::cout << " size_t length = " << m->header.length
841 << ::std::endl;
842 ::std::cout << " }" << ::std::endl;
843 ::std::cout << " data: {";
844
845 for (size_t j = 0; j < m->header.length; ++j) {
846 char data = m->data[j];
847 if (j != 0) {
848 ::std::cout << " ";
849 }
850 if (::std::isprint(data)) {
851 ::std::cout << ::std::setfill(' ') << ::std::setw(2) << ::std::hex
852 << data;
853 } else {
854 ::std::cout << "0x" << ::std::setfill('0') << ::std::setw(2)
855 << ::std::hex << (static_cast<unsigned>(data) & 0xff);
856 }
857 }
858 ::std::cout << ::std::setfill(' ') << ::std::dec << "}" << ::std::endl;
859 ::std::cout << " }," << ::std::endl;
860 }
861 ::std::cout << " }" << ::std::endl;
862
Alex Perrycb7da4b2019-08-28 19:35:56 -0700863 ::std::cout << " Sender senders[" << memory->num_senders() << "] {"
864 << ::std::endl;
Austin Schuh20b2b082019-09-11 20:42:56 -0700865 for (size_t i = 0; i < memory->num_senders(); ++i) {
866 Sender *s = memory->GetSender(i);
867 ::std::cout << " [" << i << "] -> Sender {" << ::std::endl;
868 ::std::cout << " aos_mutex tid = " << PrintMutex(&s->tid)
869 << ::std::endl;
870 ::std::cout << " AtomicIndex scratch_index = "
871 << s->scratch_index.Load().DebugString() << ::std::endl;
872 ::std::cout << " AtomicIndex to_replace = "
873 << s->to_replace.Load().DebugString() << ::std::endl;
874 ::std::cout << " }" << ::std::endl;
875 }
876 ::std::cout << " }" << ::std::endl;
877
878 ::std::cout << " Watcher watchers[" << memory->num_watchers() << "] {"
879 << ::std::endl;
880 for (size_t i = 0; i < memory->num_watchers(); ++i) {
881 Watcher *w = memory->GetWatcher(i);
882 ::std::cout << " [" << i << "] -> Watcher {" << ::std::endl;
883 ::std::cout << " aos_mutex tid = " << PrintMutex(&w->tid)
884 << ::std::endl;
885 ::std::cout << " pid_t pid = " << w->pid << ::std::endl;
886 ::std::cout << " int priority = " << w->priority << ::std::endl;
887 ::std::cout << " }" << ::std::endl;
888 }
889 ::std::cout << " }" << ::std::endl;
890
891 ::std::cout << "}" << ::std::endl;
892}
893
894} // namespace ipc_lib
895} // namespace aos