blob: c58e2e697fa6ee537432c84ffc7a24818a41c603 [file] [log] [blame]
Alex Perrycb7da4b2019-08-28 19:35:56 -07001#include "aos/realtime.h"
2
Austin Schuhcc6070c2020-10-10 20:25:56 -07003#include <malloc.h>
4#include <sched.h>
Alex Perrycb7da4b2019-08-28 19:35:56 -07005#include <sys/mman.h>
Austin Schuhcc6070c2020-10-10 20:25:56 -07006#include <sys/prctl.h>
Alex Perrycb7da4b2019-08-28 19:35:56 -07007#include <sys/resource.h>
8#include <sys/types.h>
9#include <unistd.h>
Alex Perrycb7da4b2019-08-28 19:35:56 -070010
Tyler Chatowbf0609c2021-07-31 16:13:27 -070011#include <cerrno>
12#include <cstdint>
13#include <cstdio>
14#include <cstdlib>
15#include <cstring>
16
Austin Schuhcc6070c2020-10-10 20:25:56 -070017#include "aos/thread_local.h"
Alex Perrycb7da4b2019-08-28 19:35:56 -070018#include "glog/logging.h"
Austin Schuh62288252020-11-18 23:26:04 -080019#include "glog/raw_logging.h"
Alex Perrycb7da4b2019-08-28 19:35:56 -070020
Austin Schuh62288252020-11-18 23:26:04 -080021DEFINE_bool(
22 die_on_malloc, false,
23 "If true, die when the application allocates memory in a RT section.");
Austin Schuh27553152020-11-18 21:26:37 -080024DEFINE_bool(skip_realtime_scheduler, false,
25 "If true, skip changing the scheduler. Pretend that we changed "
26 "the scheduler instead.");
27DEFINE_bool(skip_locking_memory, false,
28 "If true, skip locking memory. Pretend that we did it instead.");
29
extern "C" {
// Callback type accepted by MallocHook_AddNewHook/MallocHook_RemoveNewHook.
using MallocHook_NewHook = void (*)(const void *ptr, size_t size);
// Weak: the address of each of these is null when nothing in the final binary
// defines it, which RegisterMallocHook tests for before calling.
int MallocHook_AddNewHook(MallocHook_NewHook hook) __attribute__((weak));
int MallocHook_RemoveNewHook(MallocHook_NewHook hook) __attribute__((weak));

// Callback type accepted by MallocHook_AddDeleteHook/
// MallocHook_RemoveDeleteHook.
using MallocHook_DeleteHook = void (*)(const void *ptr);
int MallocHook_AddDeleteHook(MallocHook_DeleteHook hook) __attribute__((weak));
int MallocHook_RemoveDeleteHook(MallocHook_DeleteHook hook)
    __attribute__((weak));

// Declare tc_malloc weak so we can check if it exists.
void *tc_malloc(size_t size) __attribute__((weak));

// The libc allocator entry points that the hooks in this file forward to.
void *__libc_malloc(size_t size);
void __libc_free(void *ptr);
}  // extern "C"
Austin Schuh62288252020-11-18 23:26:04 -080046
// Weak declaration of the tcmalloc_release_rate flag. LockAllMemory takes the
// address of this variable to decide whether the flag exists before writing to
// it, so this file does not require the flag's definition to be linked in.
namespace FLAG__namespace_do_not_use_directly_use_DECLARE_double_instead {
extern double FLAGS_tcmalloc_release_rate __attribute__((weak));
}
using FLAG__namespace_do_not_use_directly_use_DECLARE_double_instead::
    FLAGS_tcmalloc_release_rate;
52
53namespace aos {
namespace logging::internal {

// Implemented in aos/logging/context.cc.  Declared weak so that callers can
// compare its address against nullptr and skip the call when no definition is
// linked in (see SetCurrentThreadName).
void ReloadThreadName() __attribute__((weak));

}  // namespace logging::internal
62
63namespace {
64
Austin Schuh27553152020-11-18 21:26:37 -080065enum class SetLimitForRoot { kYes, kNo };
James Kuszmaulb4874eb2020-01-18 17:50:35 -080066
Austin Schuh27553152020-11-18 21:26:37 -080067enum class AllowSoftLimitDecrease { kYes, kNo };
James Kuszmaulb4874eb2020-01-18 17:50:35 -080068
69void SetSoftRLimit(
70 int resource, rlim64_t soft, SetLimitForRoot set_for_root,
Austin Schuh27553152020-11-18 21:26:37 -080071 std::string_view help_string,
James Kuszmaulb4874eb2020-01-18 17:50:35 -080072 AllowSoftLimitDecrease allow_decrease = AllowSoftLimitDecrease::kYes) {
Alex Perrycb7da4b2019-08-28 19:35:56 -070073 bool am_root = getuid() == 0;
James Kuszmaulb4874eb2020-01-18 17:50:35 -080074 if (set_for_root == SetLimitForRoot::kYes || !am_root) {
Alex Perrycb7da4b2019-08-28 19:35:56 -070075 struct rlimit64 rlim;
76 PCHECK(getrlimit64(resource, &rlim) == 0)
Brian Silverman6a54ff32020-04-28 16:41:39 -070077 << ": getting limit for " << resource;
Alex Perrycb7da4b2019-08-28 19:35:56 -070078
James Kuszmaulb4874eb2020-01-18 17:50:35 -080079 if (allow_decrease == AllowSoftLimitDecrease::kYes) {
80 rlim.rlim_cur = soft;
81 } else {
82 rlim.rlim_cur = std::max(rlim.rlim_cur, soft);
83 }
Alex Perrycb7da4b2019-08-28 19:35:56 -070084 rlim.rlim_max = ::std::max(rlim.rlim_max, soft);
85
86 PCHECK(setrlimit64(resource, &rlim) == 0)
Brian Silverman6a54ff32020-04-28 16:41:39 -070087 << ": changing limit for " << resource << " to " << rlim.rlim_cur
Austin Schuh27553152020-11-18 21:26:37 -080088 << " with max of " << rlim.rlim_max << help_string;
Alex Perrycb7da4b2019-08-28 19:35:56 -070089 }
90}
91
92} // namespace
93
94void LockAllMemory() {
Austin Schuhcc6070c2020-10-10 20:25:56 -070095 CheckNotRealtime();
Alex Perrycb7da4b2019-08-28 19:35:56 -070096 // Allow locking as much as we want into RAM.
Austin Schuh27553152020-11-18 21:26:37 -080097 SetSoftRLimit(RLIMIT_MEMLOCK, RLIM_INFINITY, SetLimitForRoot::kNo,
98 "use --skip_locking_memory to not lock memory.");
Alex Perrycb7da4b2019-08-28 19:35:56 -070099
100 WriteCoreDumps();
Austin Schuh27553152020-11-18 21:26:37 -0800101 PCHECK(mlockall(MCL_CURRENT | MCL_FUTURE) == 0)
102 << ": Failed to lock memory, use --skip_locking_memory to bypass this. "
103 "Bypassing will impact RT performance.";
Alex Perrycb7da4b2019-08-28 19:35:56 -0700104
Brian Silverman4dbbcce2020-09-18 15:27:38 -0700105#if !__has_feature(address_sanitizer) && !__has_feature(memory_sanitizer)
Alex Perrycb7da4b2019-08-28 19:35:56 -0700106 // Don't give freed memory back to the OS.
107 CHECK_EQ(1, mallopt(M_TRIM_THRESHOLD, -1));
108 // Don't use mmap for large malloc chunks.
109 CHECK_EQ(1, mallopt(M_MMAP_MAX, 0));
Austin Schuh85faf672020-09-10 22:58:46 -0700110#endif
Alex Perrycb7da4b2019-08-28 19:35:56 -0700111
112 if (&FLAGS_tcmalloc_release_rate) {
113 // Tell tcmalloc not to return memory.
114 FLAGS_tcmalloc_release_rate = 0.0;
115 }
116
117 // Forces the memory pages for all the stack space that we're ever going to
118 // use to be loaded into memory (so it can be locked there).
119 uint8_t data[4096 * 8];
120 // Not 0 because linux might optimize that to a 0-filled page.
121 memset(data, 1, sizeof(data));
Austin Schuh27553152020-11-18 21:26:37 -0800122 __asm__ __volatile__("" ::"m"(data));
Alex Perrycb7da4b2019-08-28 19:35:56 -0700123
124 static const size_t kHeapPreallocSize = 512 * 1024;
125 char *const heap_data = static_cast<char *>(malloc(kHeapPreallocSize));
126 memset(heap_data, 1, kHeapPreallocSize);
Austin Schuh27553152020-11-18 21:26:37 -0800127 __asm__ __volatile__("" ::"m"(heap_data));
Alex Perrycb7da4b2019-08-28 19:35:56 -0700128 free(heap_data);
129}
130
131void InitRT() {
Austin Schuh27553152020-11-18 21:26:37 -0800132 if (FLAGS_skip_locking_memory) {
133 LOG(WARNING) << "Ignoring request to lock all memory due to "
134 "--skip_locking_memory.";
135 return;
136 }
137
Austin Schuhcc6070c2020-10-10 20:25:56 -0700138 CheckNotRealtime();
Alex Perrycb7da4b2019-08-28 19:35:56 -0700139 LockAllMemory();
140
Austin Schuh27553152020-11-18 21:26:37 -0800141 if (FLAGS_skip_realtime_scheduler) {
142 return;
143 }
Alex Perrycb7da4b2019-08-28 19:35:56 -0700144 // Only let rt processes run for 3 seconds straight.
Austin Schuh27553152020-11-18 21:26:37 -0800145 SetSoftRLimit(
146 RLIMIT_RTTIME, 3000000, SetLimitForRoot::kYes,
147 ", use --skip_realtime_scheduler to stay non-rt and bypass this "
148 "warning.");
Alex Perrycb7da4b2019-08-28 19:35:56 -0700149
150 // Allow rt processes up to priority 40.
Austin Schuh27553152020-11-18 21:26:37 -0800151 SetSoftRLimit(
152 RLIMIT_RTPRIO, 40, SetLimitForRoot::kNo,
153 ", use --skip_realtime_scheduler to stay non-rt and bypass this "
154 "warning.");
Alex Perrycb7da4b2019-08-28 19:35:56 -0700155}
156
157void UnsetCurrentThreadRealtimePriority() {
158 struct sched_param param;
159 param.sched_priority = 0;
Brian Silverman6a54ff32020-04-28 16:41:39 -0700160 PCHECK(sched_setscheduler(0, SCHED_OTHER, &param) == 0);
Austin Schuhcc6070c2020-10-10 20:25:56 -0700161 MarkRealtime(false);
Brian Silverman6a54ff32020-04-28 16:41:39 -0700162}
163
164void SetCurrentThreadAffinity(const cpu_set_t &cpuset) {
165 PCHECK(sched_setaffinity(0, sizeof(cpuset), &cpuset) == 0);
Alex Perrycb7da4b2019-08-28 19:35:56 -0700166}
167
James Kuszmaul57c2baa2020-01-19 14:52:52 -0800168void SetCurrentThreadName(const std::string_view name) {
Alex Perrycb7da4b2019-08-28 19:35:56 -0700169 CHECK_LE(name.size(), 16u) << ": thread name '" << name << "' too long";
170 VLOG(1) << "This thread is changing to '" << name << "'";
James Kuszmaul57c2baa2020-01-19 14:52:52 -0800171 std::string string_name(name);
Brian Silverman6a54ff32020-04-28 16:41:39 -0700172 PCHECK(prctl(PR_SET_NAME, string_name.c_str()) == 0)
173 << ": changing name to " << string_name;
Alex Perrycb7da4b2019-08-28 19:35:56 -0700174 if (&logging::internal::ReloadThreadName != nullptr) {
175 logging::internal::ReloadThreadName();
176 }
177}
178
Austin Schuhde973292021-10-12 18:09:49 -0700179cpu_set_t GetCurrentThreadAffinity() {
180 cpu_set_t result;
181 PCHECK(sched_getaffinity(0, sizeof(result), &result) == 0);
182 return result;
183}
184
Alex Perrycb7da4b2019-08-28 19:35:56 -0700185void SetCurrentThreadRealtimePriority(int priority) {
Austin Schuh27553152020-11-18 21:26:37 -0800186 if (FLAGS_skip_realtime_scheduler) {
187 LOG(WARNING) << "Ignoring request to switch to the RT scheduler due to "
188 "--skip_realtime_scheduler.";
189 return;
190 }
Alex Perrycb7da4b2019-08-28 19:35:56 -0700191 // Make sure we will only be allowed to run for 3 seconds straight.
Austin Schuh27553152020-11-18 21:26:37 -0800192 SetSoftRLimit(
193 RLIMIT_RTTIME, 3000000, SetLimitForRoot::kYes,
194 ", use --skip_realtime_scheduler to stay non-rt and bypass this "
195 "warning.");
Alex Perrycb7da4b2019-08-28 19:35:56 -0700196
Brian Silvermanb3826f52020-07-02 19:41:18 -0700197 // Raise our soft rlimit if necessary.
Austin Schuh27553152020-11-18 21:26:37 -0800198 SetSoftRLimit(
199 RLIMIT_RTPRIO, priority, SetLimitForRoot::kNo,
200 ", use --skip_realtime_scheduler to stay non-rt and bypass this "
201 "warning.",
202 AllowSoftLimitDecrease::kNo);
Brian Silvermanb3826f52020-07-02 19:41:18 -0700203
Alex Perrycb7da4b2019-08-28 19:35:56 -0700204 struct sched_param param;
205 param.sched_priority = priority;
Austin Schuhcc6070c2020-10-10 20:25:56 -0700206 MarkRealtime(true);
Alex Perrycb7da4b2019-08-28 19:35:56 -0700207 PCHECK(sched_setscheduler(0, SCHED_FIFO, &param) == 0)
Austin Schuh27553152020-11-18 21:26:37 -0800208 << ": changing to SCHED_FIFO with " << priority
209 << ", if you want to bypass this check for testing, use "
210 "--skip_realtime_scheduler";
Alex Perrycb7da4b2019-08-28 19:35:56 -0700211}
212
213void WriteCoreDumps() {
214 // Do create core files of unlimited size.
Austin Schuh27553152020-11-18 21:26:37 -0800215 SetSoftRLimit(RLIMIT_CORE, RLIM_INFINITY, SetLimitForRoot::kYes, "");
James Kuszmaulb4874eb2020-01-18 17:50:35 -0800216}
217
218void ExpandStackSize() {
Austin Schuh27553152020-11-18 21:26:37 -0800219 SetSoftRLimit(RLIMIT_STACK, 1000000, SetLimitForRoot::kYes, "",
James Kuszmaulb4874eb2020-01-18 17:50:35 -0800220 AllowSoftLimitDecrease::kNo);
Alex Perrycb7da4b2019-08-28 19:35:56 -0700221}
222
Austin Schuhcc6070c2020-10-10 20:25:56 -0700223namespace {
Austin Schuhf239e332021-07-30 15:27:26 -0700224// Bool to track if malloc hooks have failed to be configured.
225bool has_malloc_hook = true;
Austin Schuhcc6070c2020-10-10 20:25:56 -0700226AOS_THREAD_LOCAL bool is_realtime = false;
Tyler Chatowbf0609c2021-07-31 16:13:27 -0700227} // namespace
Austin Schuhcc6070c2020-10-10 20:25:56 -0700228
229bool MarkRealtime(bool realtime) {
Austin Schuhf239e332021-07-30 15:27:26 -0700230 if (realtime) {
231 // For some applications (generally tools built for the host in Bazel), we
232 // don't have malloc hooks available, but we also don't go realtime. Delay
233 // complaining in that case until we try to go RT and it matters.
234 CHECK(has_malloc_hook)
235 << ": Failed to register required malloc hooks before going realtime. "
236 "Disable --die_on_malloc to continue.";
237 }
Austin Schuhcc6070c2020-10-10 20:25:56 -0700238 const bool prior = is_realtime;
239 is_realtime = realtime;
240 return prior;
241}
242
243void CheckRealtime() { CHECK(is_realtime); }
244
245void CheckNotRealtime() { CHECK(!is_realtime); }
246
247ScopedRealtimeRestorer::ScopedRealtimeRestorer() : prior_(is_realtime) {}
248
Austin Schuh62288252020-11-18 23:26:04 -0800249void NewHook(const void *ptr, size_t size) {
250 if (is_realtime) {
251 is_realtime = false;
252 RAW_LOG(FATAL, "Malloced %p -> %zu bytes", ptr, size);
253 }
254}
255
256void DeleteHook(const void *ptr) {
Austin Schuhf239e332021-07-30 15:27:26 -0700257 // It is legal to call free(nullptr) unconditionally and assume that it won't
258 // do anything. Eigen does this. So, if we are RT, ignore any of these
259 // calls.
260 if (is_realtime && ptr != nullptr) {
Austin Schuh62288252020-11-18 23:26:04 -0800261 is_realtime = false;
262 RAW_LOG(FATAL, "Delete Hook %p", ptr);
263 }
264}
265
Tyler Chatow582c6c72021-07-16 13:45:07 -0700266extern "C" {
267
268// malloc hooks for libc. Tcmalloc will replace everything it finds (malloc,
269// __libc_malloc, etc.), so we need its specific hook above as well.
270void *aos_malloc_hook(size_t size) {
271 if (FLAGS_die_on_malloc && aos::is_realtime) {
272 aos::is_realtime = false;
273 RAW_LOG(FATAL, "Malloced %zu bytes", size);
274 return nullptr;
275 } else {
276 return __libc_malloc(size);
277 }
278}
279
280void aos_free_hook(void *ptr) {
281 if (FLAGS_die_on_malloc && aos::is_realtime && ptr != nullptr) {
282 aos::is_realtime = false;
283 RAW_LOG(FATAL, "Deleted %p", ptr);
284 } else {
285 __libc_free(ptr);
286 }
287}
288
289void *malloc(size_t size) __attribute__((weak, alias("aos_malloc_hook")));
290void free(void *ptr) __attribute__((weak, alias("aos_free_hook")));
291
292}
293
Austin Schuh62288252020-11-18 23:26:04 -0800294void RegisterMallocHook() {
295 if (FLAGS_die_on_malloc) {
Tyler Chatow582c6c72021-07-16 13:45:07 -0700296 // tcmalloc redefines __libc_malloc, so use this as a feature test.
297 if (&__libc_malloc == &tc_malloc) {
298 RAW_LOG(INFO, "Hooking tcmalloc for die_on_malloc");
299 if (&MallocHook_AddNewHook != nullptr) {
300 CHECK(MallocHook_AddNewHook(&NewHook));
301 } else {
302 has_malloc_hook = false;
303 }
304 if (&MallocHook_AddDeleteHook != nullptr) {
305 CHECK(MallocHook_AddDeleteHook(&DeleteHook));
306 } else {
307 has_malloc_hook = false;
308 }
Austin Schuh62288252020-11-18 23:26:04 -0800309 } else {
Tyler Chatow582c6c72021-07-16 13:45:07 -0700310 RAW_LOG(INFO, "Replacing glibc malloc");
311 if (&malloc != &aos_malloc_hook) {
312 has_malloc_hook = false;
313 }
314 if (&free != &aos_free_hook) {
315 has_malloc_hook = false;
316 }
Austin Schuh62288252020-11-18 23:26:04 -0800317 }
318 }
319}
320
Alex Perrycb7da4b2019-08-28 19:35:56 -0700321} // namespace aos