2019-11-14 19:02:54 +01:00
|
|
|
// SPDX-License-Identifier: GPL-2.0
|
2021-01-15 18:09:53 +01:00
|
|
|
/*
|
|
|
|
* KCSAN core runtime.
|
|
|
|
*
|
|
|
|
* Copyright (C) 2019, Google LLC.
|
|
|
|
*/
|
2019-11-14 19:02:54 +01:00
|
|
|
|
2020-07-31 10:17:22 +02:00
|
|
|
#define pr_fmt(fmt) "kcsan: " fmt
|
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
#include <linux/atomic.h>
|
|
|
|
#include <linux/bug.h>
|
|
|
|
#include <linux/delay.h>
|
|
|
|
#include <linux/export.h>
|
|
|
|
#include <linux/init.h>
|
2020-02-04 18:21:10 +01:00
|
|
|
#include <linux/kernel.h>
|
kcsan: Add support for scoped accesses
This adds support for scoped accesses, where the memory range is checked
for the duration of the scope. The feature is implemented by inserting
the relevant access information into a list of scoped accesses for
the current execution context, which are then checked (until removed)
on every call (through instrumentation) into the KCSAN runtime.
An alternative, more complex, implementation could set up a watchpoint for
the scoped access, and keep the watchpoint set up. This, however, would
require first exposing a handle to the watchpoint, as well as dealing
with cases such as accesses by the same thread while the watchpoint is
still set up (and several more cases). It is also doubtful if this would
provide any benefit, since the majority of delay where the watchpoint
is set up is likely due to the injected delays by KCSAN. Therefore,
the implementation in this patch is simpler and avoids hurting KCSAN's
main use-case (normal data race detection); it also implicitly increases
scoped-access race-detection-ability due to increased probability of
setting up watchpoints by repeatedly calling __kcsan_check_access()
throughout the scope of the access.
The implementation required adding an additional conditional branch to
the fast-path. However, the microbenchmark showed a *speedup* of ~5%
on the fast-path. This appears to be due to subtly improved codegen by
GCC from moving get_ctx() and associated load of preempt_count earlier.
Suggested-by: Boqun Feng <boqun.feng@gmail.com>
Suggested-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-25 17:41:56 +01:00
|
|
|
#include <linux/list.h>
|
2020-02-07 19:59:10 +01:00
|
|
|
#include <linux/moduleparam.h>
|
2019-11-14 19:02:54 +01:00
|
|
|
#include <linux/percpu.h>
|
|
|
|
#include <linux/preempt.h>
|
|
|
|
#include <linux/sched.h>
|
|
|
|
#include <linux/uaccess.h>
|
|
|
|
|
|
|
|
#include "encoding.h"
|
|
|
|
#include "kcsan.h"
|
2021-06-07 14:56:51 +02:00
|
|
|
#include "permissive.h"
|
2019-11-14 19:02:54 +01:00
|
|
|
|
2020-02-07 19:59:10 +01:00
|
|
|
static bool kcsan_early_enable = IS_ENABLED(CONFIG_KCSAN_EARLY_ENABLE);
|
2020-02-22 00:10:27 +01:00
|
|
|
unsigned int kcsan_udelay_task = CONFIG_KCSAN_UDELAY_TASK;
|
|
|
|
unsigned int kcsan_udelay_interrupt = CONFIG_KCSAN_UDELAY_INTERRUPT;
|
2020-02-07 19:59:10 +01:00
|
|
|
static long kcsan_skip_watch = CONFIG_KCSAN_SKIP_WATCH;
|
2020-02-21 23:02:09 +01:00
|
|
|
static bool kcsan_interrupt_watcher = IS_ENABLED(CONFIG_KCSAN_INTERRUPT_WATCHER);
|
2020-02-07 19:59:10 +01:00
|
|
|
|
|
|
|
#ifdef MODULE_PARAM_PREFIX
|
|
|
|
#undef MODULE_PARAM_PREFIX
|
|
|
|
#endif
|
|
|
|
#define MODULE_PARAM_PREFIX "kcsan."
|
|
|
|
module_param_named(early_enable, kcsan_early_enable, bool, 0);
|
|
|
|
module_param_named(udelay_task, kcsan_udelay_task, uint, 0644);
|
|
|
|
module_param_named(udelay_interrupt, kcsan_udelay_interrupt, uint, 0644);
|
|
|
|
module_param_named(skip_watch, kcsan_skip_watch, long, 0644);
|
2020-02-21 23:02:09 +01:00
|
|
|
module_param_named(interrupt_watcher, kcsan_interrupt_watcher, bool, 0444);
|
2020-02-07 19:59:10 +01:00
|
|
|
|
2021-08-05 14:57:45 +02:00
|
|
|
#ifdef CONFIG_KCSAN_WEAK_MEMORY
|
|
|
|
static bool kcsan_weak_memory = true;
|
|
|
|
module_param_named(weak_memory, kcsan_weak_memory, bool, 0644);
|
|
|
|
#else
|
|
|
|
#define kcsan_weak_memory false
|
|
|
|
#endif
|
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
bool kcsan_enabled;
|
|
|
|
|
|
|
|
/* Per-CPU kcsan_ctx for interrupts */
|
|
|
|
static DEFINE_PER_CPU(struct kcsan_ctx, kcsan_cpu_ctx) = {
|
kcsan: Add support for scoped accesses
This adds support for scoped accesses, where the memory range is checked
for the duration of the scope. The feature is implemented by inserting
the relevant access information into a list of scoped accesses for
the current execution context, which are then checked (until removed)
on every call (through instrumentation) into the KCSAN runtime.
An alternative, more complex, implementation could set up a watchpoint for
the scoped access, and keep the watchpoint set up. This, however, would
require first exposing a handle to the watchpoint, as well as dealing
with cases such as accesses by the same thread while the watchpoint is
still set up (and several more cases). It is also doubtful if this would
provide any benefit, since the majority of delay where the watchpoint
is set up is likely due to the injected delays by KCSAN. Therefore,
the implementation in this patch is simpler and avoids hurting KCSAN's
main use-case (normal data race detection); it also implicitly increases
scoped-access race-detection-ability due to increased probability of
setting up watchpoints by repeatedly calling __kcsan_check_access()
throughout the scope of the access.
The implementation required adding an additional conditional branch to
the fast-path. However, the microbenchmark showed a *speedup* of ~5%
on the fast-path. This appears to be due to subtly improved codegen by
GCC from moving get_ctx() and associated load of preempt_count earlier.
Suggested-by: Boqun Feng <boqun.feng@gmail.com>
Suggested-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-25 17:41:56 +01:00
|
|
|
.scoped_accesses = {LIST_POISON1, NULL},
|
2019-11-14 19:02:54 +01:00
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * Helper macros to index into adjacent slots, starting from address slot
 * itself, followed by the right and left slots.
 *
 * The purpose is 2-fold:
 *
 *	1. if during insertion the address slot is already occupied, check if
 *	   any adjacent slots are free;
 *	2. accesses that straddle a slot boundary due to size that exceeds a
 *	   slot's range may check adjacent slots if any watchpoint matches.
 *
 * Note that accesses with very large size may still miss a watchpoint; however,
 * given this should be rare, this is a reasonable trade-off to make, since this
 * will avoid:
 *
 *	1. excessive contention between watchpoint checks and setup;
 *	2. larger number of simultaneous watchpoints without sacrificing
 *	   performance.
 *
 * Example: SLOT_IDX values for KCSAN_CHECK_ADJACENT=1, where i is [0, 1, 2]:
 *
 *   slot=0:  [ 1,  2,  0]
 *   slot=9:  [10, 11,  9]
 *   slot=63: [64, 65, 63]
 *
 * Both arguments are parenthesized in the expansion so that callers may pass
 * arbitrary expressions (e.g. "a ? b : c") without precedence surprises.
 */
#define SLOT_IDX(slot, i) ((slot) + (((i) + KCSAN_CHECK_ADJACENT) % NUM_SLOTS))
|
|
|
|
|
|
|
|
/*
 * SLOT_IDX_FAST is used in the fast-path. Not first checking the address's primary
 * slot (middle) is fine if we assume that races occur rarely. The set of
 * indices {SLOT_IDX(slot, i) | i in [0, NUM_SLOTS)} is equivalent to
 * {SLOT_IDX_FAST(slot, i) | i in [0, NUM_SLOTS)}.
 *
 * Arguments are parenthesized so that expression arguments expand safely.
 */
#define SLOT_IDX_FAST(slot, i) ((slot) + (i))
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Watchpoints, with each entry encoded as defined in encoding.h: in order to be
|
|
|
|
* able to safely update and access a watchpoint without introducing locking
|
|
|
|
* overhead, we encode each watchpoint as a single atomic long. The initial
|
|
|
|
* zero-initialized state matches INVALID_WATCHPOINT.
|
|
|
|
*
|
|
|
|
* Add NUM_SLOTS-1 entries to account for overflow; this helps avoid having to
|
2019-11-20 10:41:43 +01:00
|
|
|
* use more complicated SLOT_IDX_FAST calculation with modulo in the fast-path.
|
2019-11-14 19:02:54 +01:00
|
|
|
*/
|
2019-11-20 10:41:43 +01:00
|
|
|
static atomic_long_t watchpoints[CONFIG_KCSAN_NUM_WATCHPOINTS + NUM_SLOTS-1];
|
2019-11-14 19:02:54 +01:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Instructions to skip watching counter, used in should_watch(). We use a
|
|
|
|
* per-CPU counter to avoid excessive contention.
|
|
|
|
*/
|
|
|
|
static DEFINE_PER_CPU(long, kcsan_skip);
|
|
|
|
|
2020-08-21 14:31:26 +02:00
|
|
|
/* For kcsan_prandom_u32_max(). */
|
2020-11-24 12:02:09 +01:00
|
|
|
static DEFINE_PER_CPU(u32, kcsan_rand_state);
|
2020-08-21 14:31:26 +02:00
|
|
|
|
2020-01-07 17:31:04 +01:00
|
|
|
/*
 * Scan the NUM_SLOTS candidate slots for @addr and return the first valid
 * watchpoint that overlaps the access [@addr, @addr + @size).
 *
 * @expect_write: if true, only watchpoints set up for writes are considered.
 * @encoded_watchpoint: receives the raw value read from each probed slot; on
 *                      a successful return it holds the encoding of the
 *                      returned watchpoint.
 *
 * Returns the matching slot, or NULL if none of the probed slots matches.
 */
static __always_inline atomic_long_t *find_watchpoint(unsigned long addr,
						      size_t size,
						      bool expect_write,
						      long *encoded_watchpoint)
{
	const int slot = watchpoint_slot(addr);
	const unsigned long addr_masked = addr & WATCHPOINT_ADDR_MASK;
	int i;

	BUILD_BUG_ON(CONFIG_KCSAN_NUM_WATCHPOINTS < NUM_SLOTS);

	for (i = 0; i < NUM_SLOTS; ++i) {
		atomic_long_t *candidate = &watchpoints[SLOT_IDX_FAST(slot, i)];
		unsigned long wp_addr_masked;
		size_t wp_size;
		bool wp_is_write;

		*encoded_watchpoint = atomic_long_read(candidate);

		/* Skip slots that do not hold a decodable watchpoint. */
		if (!decode_watchpoint(*encoded_watchpoint, &wp_addr_masked,
				       &wp_size, &wp_is_write))
			continue;

		/* Take it if the kind is acceptable and the ranges match. */
		if ((!expect_write || wp_is_write) &&
		    matching_access(wp_addr_masked, wp_size, addr_masked, size))
			return candidate;
	}

	return NULL;
}
|
|
|
|
|
2019-11-20 10:41:43 +01:00
|
|
|
static inline atomic_long_t *
|
|
|
|
insert_watchpoint(unsigned long addr, size_t size, bool is_write)
|
2019-11-14 19:02:54 +01:00
|
|
|
{
|
|
|
|
const int slot = watchpoint_slot(addr);
|
|
|
|
const long encoded_watchpoint = encode_watchpoint(addr, size, is_write);
|
|
|
|
atomic_long_t *watchpoint;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
/* Check slot index logic, ensuring we stay within array bounds. */
|
|
|
|
BUILD_BUG_ON(SLOT_IDX(0, 0) != KCSAN_CHECK_ADJACENT);
|
2019-11-20 10:41:43 +01:00
|
|
|
BUILD_BUG_ON(SLOT_IDX(0, KCSAN_CHECK_ADJACENT+1) != 0);
|
|
|
|
BUILD_BUG_ON(SLOT_IDX(CONFIG_KCSAN_NUM_WATCHPOINTS-1, KCSAN_CHECK_ADJACENT) != ARRAY_SIZE(watchpoints)-1);
|
|
|
|
BUILD_BUG_ON(SLOT_IDX(CONFIG_KCSAN_NUM_WATCHPOINTS-1, KCSAN_CHECK_ADJACENT+1) != ARRAY_SIZE(watchpoints) - NUM_SLOTS);
|
2019-11-14 19:02:54 +01:00
|
|
|
|
|
|
|
for (i = 0; i < NUM_SLOTS; ++i) {
|
|
|
|
long expect_val = INVALID_WATCHPOINT;
|
|
|
|
|
|
|
|
/* Try to acquire this slot. */
|
|
|
|
watchpoint = &watchpoints[SLOT_IDX(slot, i)];
|
2019-11-20 10:41:43 +01:00
|
|
|
if (atomic_long_try_cmpxchg_relaxed(watchpoint, &expect_val, encoded_watchpoint))
|
2019-11-14 19:02:54 +01:00
|
|
|
return watchpoint;
|
|
|
|
}
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Return true if watchpoint was successfully consumed, false otherwise.
|
|
|
|
*
|
|
|
|
* This may return false if:
|
|
|
|
*
|
|
|
|
* 1. another thread already consumed the watchpoint;
|
|
|
|
* 2. the thread that set up the watchpoint already removed it;
|
|
|
|
* 3. the watchpoint was removed and then re-used.
|
|
|
|
*/
|
2020-01-07 17:31:04 +01:00
|
|
|
static __always_inline bool
|
2019-11-20 10:41:43 +01:00
|
|
|
try_consume_watchpoint(atomic_long_t *watchpoint, long encoded_watchpoint)
|
2019-11-14 19:02:54 +01:00
|
|
|
{
|
2019-11-20 10:41:43 +01:00
|
|
|
return atomic_long_try_cmpxchg_relaxed(watchpoint, &encoded_watchpoint, CONSUMED_WATCHPOINT);
|
2019-11-14 19:02:54 +01:00
|
|
|
}
|
|
|
|
|
kcsan: Avoid blocking producers in prepare_report()
To avoid deadlock in case watchers can be interrupted, we need to ensure
that producers of the struct other_info can never be blocked by an
unrelated consumer. (Likely to occur with KCSAN_INTERRUPT_WATCHER.)
There are several cases that can lead to this scenario, for example:
1. A watchpoint A was set up by task T1, but interrupted by
interrupt I1. Some other thread (task or interrupt) finds
watchpoint A consumes it, and sets other_info. Then I1 also
finds some unrelated watchpoint B, consumes it, but is blocked
because other_info is in use. T1 cannot consume other_info
because I1 never returns -> deadlock.
2. A watchpoint A was set up by task T1, but interrupted by
interrupt I1, which also sets up a watchpoint B. Some other
thread finds watchpoint A, and consumes it and sets up
other_info with its information. Similarly some other thread
finds watchpoint B and consumes it, but is then blocked because
other_info is in use. When I1 continues it sees its watchpoint
was consumed, and that it must wait for other_info, which
currently contains information to be consumed by T1. However, T1
cannot unblock other_info because I1 never returns -> deadlock.
To avoid this, we need to ensure that producers of struct other_info
always have a usable other_info entry. This is obviously not the case
with only a single instance of struct other_info, as concurrent
producers must wait for the entry to be released by some consumer (which
may be locked up as illustrated above).
While it would be nice if producers could simply call kmalloc() and
append their instance of struct other_info to a list, we are very
limited in this code path: since KCSAN can instrument the allocators
themselves, calling kmalloc() could lead to deadlock or corrupted
allocator state.
Since producers of the struct other_info will always succeed at
try_consume_watchpoint(), preceding the call into kcsan_report(), we
know that the particular watchpoint slot cannot simply be reused or
consumed by another potential other_info producer. If we move removal of
a watchpoint after reporting (by the consumer of struct other_info), we
can see a consumed watchpoint as a held lock on elements of other_info,
if we create a one-to-one mapping of a watchpoint to an other_info
element.
Therefore, the simplest solution is to create an array of struct
other_info that is as large as the watchpoints array in core.c, and pass
the watchpoint index to kcsan_report() for producers and consumers, and
change watchpoints to be removed after reporting is done.
With a default config on a 64-bit system, the array other_infos consumes
~37KiB. For most systems today this is not a problem. On smaller memory
constrained systems, the config value CONFIG_KCSAN_NUM_WATCHPOINTS can
be reduced appropriately.
Overall, this change is a simplification of the prepare_report() code,
and makes some of the checks (such as checking if at least one access is
a write) redundant.
Tested:
$ tools/testing/selftests/rcutorture/bin/kvm.sh \
--cpus 12 --duration 10 --kconfig "CONFIG_DEBUG_INFO=y \
CONFIG_KCSAN=y CONFIG_KCSAN_ASSUME_PLAIN_WRITES_ATOMIC=n \
CONFIG_KCSAN_REPORT_VALUE_CHANGE_ONLY=n \
CONFIG_KCSAN_REPORT_ONCE_IN_MS=100000 CONFIG_KCSAN_VERBOSE=y \
CONFIG_KCSAN_INTERRUPT_WATCHER=y CONFIG_PROVE_LOCKING=y" \
--configs TREE03
=> No longer hangs and runs to completion as expected.
Reported-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-18 18:38:45 +01:00
|
|
|
/* Return true if watchpoint was not touched, false if already consumed. */
|
|
|
|
static inline bool consume_watchpoint(atomic_long_t *watchpoint)
|
2019-11-14 19:02:54 +01:00
|
|
|
{
|
kcsan: Avoid blocking producers in prepare_report()
To avoid deadlock in case watchers can be interrupted, we need to ensure
that producers of the struct other_info can never be blocked by an
unrelated consumer. (Likely to occur with KCSAN_INTERRUPT_WATCHER.)
There are several cases that can lead to this scenario, for example:
1. A watchpoint A was set up by task T1, but interrupted by
interrupt I1. Some other thread (task or interrupt) finds
watchpoint A consumes it, and sets other_info. Then I1 also
finds some unrelated watchpoint B, consumes it, but is blocked
because other_info is in use. T1 cannot consume other_info
because I1 never returns -> deadlock.
2. A watchpoint A was set up by task T1, but interrupted by
interrupt I1, which also sets up a watchpoint B. Some other
thread finds watchpoint A, and consumes it and sets up
other_info with its information. Similarly some other thread
finds watchpoint B and consumes it, but is then blocked because
other_info is in use. When I1 continues it sees its watchpoint
was consumed, and that it must wait for other_info, which
currently contains information to be consumed by T1. However, T1
cannot unblock other_info because I1 never returns -> deadlock.
To avoid this, we need to ensure that producers of struct other_info
always have a usable other_info entry. This is obviously not the case
with only a single instance of struct other_info, as concurrent
producers must wait for the entry to be released by some consumer (which
may be locked up as illustrated above).
While it would be nice if producers could simply call kmalloc() and
append their instance of struct other_info to a list, we are very
limited in this code path: since KCSAN can instrument the allocators
themselves, calling kmalloc() could lead to deadlock or corrupted
allocator state.
Since producers of the struct other_info will always succeed at
try_consume_watchpoint(), preceding the call into kcsan_report(), we
know that the particular watchpoint slot cannot simply be reused or
consumed by another potential other_info producer. If we move removal of
a watchpoint after reporting (by the consumer of struct other_info), we
can see a consumed watchpoint as a held lock on elements of other_info,
if we create a one-to-one mapping of a watchpoint to an other_info
element.
Therefore, the simplest solution is to create an array of struct
other_info that is as large as the watchpoints array in core.c, and pass
the watchpoint index to kcsan_report() for producers and consumers, and
change watchpoints to be removed after reporting is done.
With a default config on a 64-bit system, the array other_infos consumes
~37KiB. For most systems today this is not a problem. On smaller memory
constrained systems, the config value CONFIG_KCSAN_NUM_WATCHPOINTS can
be reduced appropriately.
Overall, this change is a simplification of the prepare_report() code,
and makes some of the checks (such as checking if at least one access is
a write) redundant.
Tested:
$ tools/testing/selftests/rcutorture/bin/kvm.sh \
--cpus 12 --duration 10 --kconfig "CONFIG_DEBUG_INFO=y \
CONFIG_KCSAN=y CONFIG_KCSAN_ASSUME_PLAIN_WRITES_ATOMIC=n \
CONFIG_KCSAN_REPORT_VALUE_CHANGE_ONLY=n \
CONFIG_KCSAN_REPORT_ONCE_IN_MS=100000 CONFIG_KCSAN_VERBOSE=y \
CONFIG_KCSAN_INTERRUPT_WATCHER=y CONFIG_PROVE_LOCKING=y" \
--configs TREE03
=> No longer hangs and runs to completion as expected.
Reported-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-18 18:38:45 +01:00
|
|
|
return atomic_long_xchg_relaxed(watchpoint, CONSUMED_WATCHPOINT) != CONSUMED_WATCHPOINT;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Remove the watchpoint -- its slot may be reused after. */
|
|
|
|
static inline void remove_watchpoint(atomic_long_t *watchpoint)
|
|
|
|
{
|
|
|
|
atomic_long_set(watchpoint, INVALID_WATCHPOINT);
|
2019-11-14 19:02:54 +01:00
|
|
|
}
|
|
|
|
|
2020-01-07 17:31:04 +01:00
|
|
|
static __always_inline struct kcsan_ctx *get_ctx(void)
|
2019-11-14 19:02:54 +01:00
|
|
|
{
|
|
|
|
/*
|
2019-11-20 10:41:43 +01:00
|
|
|
* In interrupts, use raw_cpu_ptr to avoid unnecessary checks, that would
|
2019-11-14 19:02:54 +01:00
|
|
|
* also result in calls that generate warnings in uaccess regions.
|
|
|
|
*/
|
|
|
|
return in_task() ? ¤t->kcsan_ctx : raw_cpu_ptr(&kcsan_cpu_ctx);
|
|
|
|
}
|
|
|
|
|
2021-08-09 13:25:13 +02:00
|
|
|
/*
 * Forward declaration, needed because kcsan_check_scoped_accesses() below
 * calls check_access(); the definition is not part of this section.
 */
static __always_inline void check_access(const volatile void *ptr, size_t size,
					 int type, unsigned long ip);
|
|
|
|
|
kcsan: Add support for scoped accesses
This adds support for scoped accesses, where the memory range is checked
for the duration of the scope. The feature is implemented by inserting
the relevant access information into a list of scoped accesses for
the current execution context, which are then checked (until removed)
on every call (through instrumentation) into the KCSAN runtime.
An alternative, more complex, implementation could set up a watchpoint for
the scoped access, and keep the watchpoint set up. This, however, would
require first exposing a handle to the watchpoint, as well as dealing
with cases such as accesses by the same thread while the watchpoint is
still set up (and several more cases). It is also doubtful if this would
provide any benefit, since the majority of delay where the watchpoint
is set up is likely due to the injected delays by KCSAN. Therefore,
the implementation in this patch is simpler and avoids hurting KCSAN's
main use-case (normal data race detection); it also implicitly increases
scoped-access race-detection-ability due to increased probability of
setting up watchpoints by repeatedly calling __kcsan_check_access()
throughout the scope of the access.
The implementation required adding an additional conditional branch to
the fast-path. However, the microbenchmark showed a *speedup* of ~5%
on the fast-path. This appears to be due to subtly improved codegen by
GCC from moving get_ctx() and associated load of preempt_count earlier.
Suggested-by: Boqun Feng <boqun.feng@gmail.com>
Suggested-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-25 17:41:56 +01:00
|
|
|
/* Check scoped accesses; never inline because this is a slow-path! */
|
|
|
|
static noinline void kcsan_check_scoped_accesses(void)
|
|
|
|
{
|
|
|
|
struct kcsan_ctx *ctx = get_ctx();
|
|
|
|
struct kcsan_scoped_access *scoped_access;
|
|
|
|
|
2021-11-30 12:44:11 +01:00
|
|
|
if (ctx->disable_scoped)
|
|
|
|
return;
|
|
|
|
|
|
|
|
ctx->disable_scoped++;
|
2021-08-09 13:25:13 +02:00
|
|
|
list_for_each_entry(scoped_access, &ctx->scoped_accesses, list) {
|
|
|
|
check_access(scoped_access->ptr, scoped_access->size,
|
|
|
|
scoped_access->type, scoped_access->ip);
|
|
|
|
}
|
2021-11-30 12:44:11 +01:00
|
|
|
ctx->disable_scoped--;
|
kcsan: Add support for scoped accesses
This adds support for scoped accesses, where the memory range is checked
for the duration of the scope. The feature is implemented by inserting
the relevant access information into a list of scoped accesses for
the current execution context, which are then checked (until removed)
on every call (through instrumentation) into the KCSAN runtime.
An alternative, more complex, implementation could set up a watchpoint for
the scoped access, and keep the watchpoint set up. This, however, would
require first exposing a handle to the watchpoint, as well as dealing
with cases such as accesses by the same thread while the watchpoint is
still set up (and several more cases). It is also doubtful if this would
provide any benefit, since the majority of delay where the watchpoint
is set up is likely due to the injected delays by KCSAN. Therefore,
the implementation in this patch is simpler and avoids hurting KCSAN's
main use-case (normal data race detection); it also implicitly increases
scoped-access race-detection-ability due to increased probability of
setting up watchpoints by repeatedly calling __kcsan_check_access()
throughout the scope of the access.
The implementation required adding an additional conditional branch to
the fast-path. However, the microbenchmark showed a *speedup* of ~5%
on the fast-path. This appears to be due to subtly improved codegen by
GCC from moving get_ctx() and associated load of preempt_count earlier.
Suggested-by: Boqun Feng <boqun.feng@gmail.com>
Suggested-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-25 17:41:56 +01:00
|
|
|
}
|
|
|
|
|
2020-02-25 15:32:58 +01:00
|
|
|
/* Rules for generic atomic accesses. Called from fast-path. */
|
2020-02-04 18:21:10 +01:00
|
|
|
static __always_inline bool
|
2021-08-09 13:25:16 +02:00
|
|
|
is_atomic(struct kcsan_ctx *ctx, const volatile void *ptr, size_t size, int type)
|
2019-11-14 19:02:54 +01:00
|
|
|
{
|
2020-02-25 15:32:58 +01:00
|
|
|
if (type & KCSAN_ACCESS_ATOMIC)
|
2020-02-04 18:21:10 +01:00
|
|
|
return true;
|
2019-11-14 19:02:54 +01:00
|
|
|
|
kcsan: Introduce KCSAN_ACCESS_ASSERT access type
The KCSAN_ACCESS_ASSERT access type may be used to introduce dummy reads
and writes to assert certain properties of concurrent code, where bugs
could not be detected as normal data races.
For example, a variable that is only meant to be written by a single
CPU, but may be read (without locking) by other CPUs must still be
marked properly to avoid data races. However, concurrent writes,
regardless if WRITE_ONCE() or not, would be a bug. Using
kcsan_check_access(&x, sizeof(x), KCSAN_ACCESS_ASSERT) would allow
catching such bugs.
To support KCSAN_ACCESS_ASSERT the following notable changes were made:
* If an access is of type KCSAN_ASSERT_ACCESS, disable various filters
that only apply to data races, so that all races that KCSAN observes are
reported.
* Bug reports that involve an ASSERT access type will be reported as
"KCSAN: assert: race in ..." instead of "data-race"; this will help
more easily distinguish them.
* Update a few comments to just mention 'races' where we do not always
mean pure data races.
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2020-02-06 16:46:24 +01:00
|
|
|
/*
|
|
|
|
* Unless explicitly declared atomic, never consider an assertion access
|
|
|
|
* as atomic. This allows using them also in atomic regions, such as
|
|
|
|
* seqlocks, without implicitly changing their semantics.
|
|
|
|
*/
|
2020-02-25 15:32:58 +01:00
|
|
|
if (type & KCSAN_ACCESS_ASSERT)
|
kcsan: Introduce KCSAN_ACCESS_ASSERT access type
The KCSAN_ACCESS_ASSERT access type may be used to introduce dummy reads
and writes to assert certain properties of concurrent code, where bugs
could not be detected as normal data races.
For example, a variable that is only meant to be written by a single
CPU, but may be read (without locking) by other CPUs must still be
marked properly to avoid data races. However, concurrent writes,
regardless if WRITE_ONCE() or not, would be a bug. Using
kcsan_check_access(&x, sizeof(x), KCSAN_ACCESS_ASSERT) would allow
catching such bugs.
To support KCSAN_ACCESS_ASSERT the following notable changes were made:
* If an access is of type KCSAN_ASSERT_ACCESS, disable various filters
that only apply to data races, so that all races that KCSAN observes are
reported.
* Bug reports that involve an ASSERT access type will be reported as
"KCSAN: assert: race in ..." instead of "data-race"; this will help
more easily distinguish them.
* Update a few comments to just mention 'races' where we do not always
mean pure data races.
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2020-02-06 16:46:24 +01:00
|
|
|
return false;
|
|
|
|
|
2020-02-04 18:21:10 +01:00
|
|
|
if (IS_ENABLED(CONFIG_KCSAN_ASSUME_PLAIN_WRITES_ATOMIC) &&
|
2020-02-25 15:32:58 +01:00
|
|
|
(type & KCSAN_ACCESS_WRITE) && size <= sizeof(long) &&
|
kcsan: Support compounded read-write instrumentation
Add support for compounded read-write instrumentation if supported by
the compiler. Adds the necessary instrumentation functions, and a new
type which is used to generate a more descriptive report.
Furthermore, such compounded memory access instrumentation is excluded
from the "assume aligned writes up to word size are atomic" rule,
because we cannot assume that the compiler emits code that is atomic for
compound ops.
LLVM/Clang added support for the feature in:
https://github.com/llvm/llvm-project/commit/785d41a261d136b64ab6c15c5d35f2adc5ad53e3
The new instrumentation is emitted for sets of memory accesses in the
same basic block to the same address with at least one read appearing
before a write. These typically result from compound operations such as
++, --, +=, -=, |=, &=, etc. but also equivalent forms such as "var =
var + 1". Where the compiler determines that it is equivalent to emit a
call to a single __tsan_read_write instead of separate __tsan_read and
__tsan_write, we can then benefit from improved performance and better
reporting for such access patterns.
The new reports now show that the ops are both reads and writes, for
example:
read-write to 0xffffffff90548a38 of 8 bytes by task 143 on cpu 3:
test_kernel_rmw_array+0x45/0xa0
access_thread+0x71/0xb0
kthread+0x21e/0x240
ret_from_fork+0x22/0x30
read-write to 0xffffffff90548a38 of 8 bytes by task 144 on cpu 2:
test_kernel_rmw_array+0x45/0xa0
access_thread+0x71/0xb0
kthread+0x21e/0x240
ret_from_fork+0x22/0x30
Acked-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-07-24 09:00:01 +02:00
|
|
|
!(type & KCSAN_ACCESS_COMPOUND) && IS_ALIGNED((unsigned long)ptr, size))
|
2020-02-04 18:21:10 +01:00
|
|
|
return true; /* Assume aligned writes up to word size are atomic. */
|
|
|
|
|
2020-02-25 15:32:58 +01:00
|
|
|
if (ctx->atomic_next > 0) {
|
2019-11-14 19:02:54 +01:00
|
|
|
/*
|
|
|
|
* Because we do not have separate contexts for nested
|
|
|
|
* interrupts, in case atomic_next is set, we simply assume that
|
|
|
|
* the outer interrupt set atomic_next. In the worst case, we
|
|
|
|
* will conservatively consider operations as atomic. This is a
|
|
|
|
* reasonable trade-off to make, since this case should be
|
|
|
|
* extremely rare; however, even if extremely rare, it could
|
|
|
|
* lead to false positives otherwise.
|
|
|
|
*/
|
|
|
|
if ((hardirq_count() >> HARDIRQ_SHIFT) < 2)
|
|
|
|
--ctx->atomic_next; /* in task, or outer interrupt */
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2020-02-25 15:32:58 +01:00
|
|
|
return ctx->atomic_nest_count > 0 || ctx->in_flat_atomic;
|
2019-11-14 19:02:54 +01:00
|
|
|
}
|
|
|
|
|
2020-02-04 18:21:10 +01:00
|
|
|
static __always_inline bool
|
2021-08-09 13:25:16 +02:00
|
|
|
should_watch(struct kcsan_ctx *ctx, const volatile void *ptr, size_t size, int type)
|
2019-11-14 19:02:54 +01:00
|
|
|
{
|
|
|
|
/*
|
|
|
|
* Never set up watchpoints when memory operations are atomic.
|
|
|
|
*
|
|
|
|
* Need to check this first, before kcsan_skip check below: (1) atomics
|
|
|
|
* should not count towards skipped instructions, and (2) to actually
|
|
|
|
* decrement kcsan_atomic_next for consecutive instruction stream.
|
|
|
|
*/
|
2021-08-09 13:25:16 +02:00
|
|
|
if (is_atomic(ctx, ptr, size, type))
|
2019-11-14 19:02:54 +01:00
|
|
|
return false;
|
|
|
|
|
|
|
|
if (this_cpu_dec_return(kcsan_skip) >= 0)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* NOTE: If we get here, kcsan_skip must always be reset in slow path
|
|
|
|
* via reset_kcsan_skip() to avoid underflow.
|
|
|
|
*/
|
|
|
|
|
|
|
|
/* this operation should be watched */
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2020-08-21 14:31:26 +02:00
|
|
|
/*
|
2020-11-24 12:02:09 +01:00
|
|
|
* Returns a pseudo-random number in interval [0, ep_ro). Simple linear
|
|
|
|
* congruential generator, using constants from "Numerical Recipes".
|
2020-08-21 14:31:26 +02:00
|
|
|
*/
|
|
|
|
static u32 kcsan_prandom_u32_max(u32 ep_ro)
|
|
|
|
{
|
2020-11-24 12:02:09 +01:00
|
|
|
u32 state = this_cpu_read(kcsan_rand_state);
|
|
|
|
|
|
|
|
state = 1664525 * state + 1013904223;
|
|
|
|
this_cpu_write(kcsan_rand_state, state);
|
2020-08-21 14:31:26 +02:00
|
|
|
|
2020-11-24 12:02:09 +01:00
|
|
|
return state % ep_ro;
|
2020-08-21 14:31:26 +02:00
|
|
|
}
|
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
static inline void reset_kcsan_skip(void)
|
|
|
|
{
|
2020-02-07 19:59:10 +01:00
|
|
|
long skip_count = kcsan_skip_watch -
|
2019-11-14 19:02:54 +01:00
|
|
|
(IS_ENABLED(CONFIG_KCSAN_SKIP_WATCH_RANDOMIZE) ?
|
2020-08-21 14:31:26 +02:00
|
|
|
kcsan_prandom_u32_max(kcsan_skip_watch) :
|
2019-11-14 19:02:54 +01:00
|
|
|
0);
|
|
|
|
this_cpu_write(kcsan_skip, skip_count);
|
|
|
|
}
|
|
|
|
|
2021-06-07 14:56:50 +02:00
|
|
|
/*
 * KCSAN is active for @ctx only if it is globally enabled (kcsan_enabled) and
 * the context's disable_count is zero.
 */
static __always_inline bool kcsan_is_enabled(struct kcsan_ctx *ctx)
{
	if (!READ_ONCE(kcsan_enabled))
		return false;

	return ctx->disable_count == 0;
}
|
|
|
|
|
2020-08-21 14:31:26 +02:00
|
|
|
/* Introduce delay depending on context and configuration. */
|
|
|
|
static void delay_access(int type)
|
2019-11-14 19:02:54 +01:00
|
|
|
{
|
2020-02-07 19:59:10 +01:00
|
|
|
unsigned int delay = in_task() ? kcsan_udelay_task : kcsan_udelay_interrupt;
|
2020-07-24 09:00:03 +02:00
|
|
|
/* For certain access types, skew the random delay to be longer. */
|
|
|
|
unsigned int skew_delay_order =
|
|
|
|
(type & (KCSAN_ACCESS_COMPOUND | KCSAN_ACCESS_ASSERT)) ? 1 : 0;
|
|
|
|
|
2020-08-21 14:31:26 +02:00
|
|
|
delay -= IS_ENABLED(CONFIG_KCSAN_DELAY_RANDOMIZE) ?
|
|
|
|
kcsan_prandom_u32_max(delay >> skew_delay_order) :
|
|
|
|
0;
|
|
|
|
udelay(delay);
|
2019-11-14 19:02:54 +01:00
|
|
|
}
|
|
|
|
|
2021-11-30 12:44:09 +01:00
|
|
|
/*
|
|
|
|
* Reads the instrumented memory for value change detection; value change
|
|
|
|
* detection is currently done for accesses up to a size of 8 bytes.
|
|
|
|
*/
|
|
|
|
static __always_inline u64 read_instrumented_memory(const volatile void *ptr, size_t size)
|
|
|
|
{
|
|
|
|
switch (size) {
|
|
|
|
case 1: return READ_ONCE(*(const u8 *)ptr);
|
|
|
|
case 2: return READ_ONCE(*(const u16 *)ptr);
|
|
|
|
case 4: return READ_ONCE(*(const u32 *)ptr);
|
|
|
|
case 8: return READ_ONCE(*(const u64 *)ptr);
|
|
|
|
default: return 0; /* Ignore; we do not diff the values. */
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-07-29 13:09:16 +02:00
|
|
|
/*
 * Copy @task's irqtrace into task->kcsan_save_irqtrace so that it can later
 * be put back with kcsan_restore_irqtrace(). Compiles to nothing unless
 * CONFIG_TRACE_IRQFLAGS is defined.
 */
void kcsan_save_irqtrace(struct task_struct *task)
{
#if defined(CONFIG_TRACE_IRQFLAGS)
	task->kcsan_save_irqtrace = task->irqtrace;
#endif
}
|
|
|
|
|
|
|
|
/*
 * Counterpart of kcsan_save_irqtrace(): copy task->kcsan_save_irqtrace back
 * into @task's irqtrace. Compiles to nothing unless CONFIG_TRACE_IRQFLAGS is
 * defined.
 */
void kcsan_restore_irqtrace(struct task_struct *task)
{
#if defined(CONFIG_TRACE_IRQFLAGS)
	task->irqtrace = task->kcsan_save_irqtrace;
#endif
}
|
|
|
|
|
2021-08-05 14:57:45 +02:00
|
|
|
/*
 * Returns current->kcsan_stack_depth. Only usable with
 * CONFIG_KCSAN_WEAK_MEMORY; in other configurations any call that is not
 * eliminated at compile time trips BUILD_BUG().
 */
static __always_inline int get_kcsan_stack_depth(void)
{
#ifndef CONFIG_KCSAN_WEAK_MEMORY
	BUILD_BUG();
	return 0;
#else
	return current->kcsan_stack_depth;
#endif
}
|
|
|
|
|
|
|
|
/*
 * Adds @val to current->kcsan_stack_depth. Only usable with
 * CONFIG_KCSAN_WEAK_MEMORY; in other configurations any call that is not
 * eliminated at compile time trips BUILD_BUG().
 */
static __always_inline void add_kcsan_stack_depth(int val)
{
#ifndef CONFIG_KCSAN_WEAK_MEMORY
	BUILD_BUG();
#else
	current->kcsan_stack_depth += val;
#endif
}
|
|
|
|
|
|
|
|
static __always_inline struct kcsan_scoped_access *get_reorder_access(struct kcsan_ctx *ctx)
|
|
|
|
{
|
|
|
|
#ifdef CONFIG_KCSAN_WEAK_MEMORY
|
|
|
|
return ctx->disable_scoped ? NULL : &ctx->reorder_access;
|
|
|
|
#else
|
|
|
|
return NULL;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
|
|
|
static __always_inline bool
|
|
|
|
find_reorder_access(struct kcsan_ctx *ctx, const volatile void *ptr, size_t size,
|
|
|
|
int type, unsigned long ip)
|
|
|
|
{
|
|
|
|
struct kcsan_scoped_access *reorder_access = get_reorder_access(ctx);
|
|
|
|
|
|
|
|
if (!reorder_access)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Note: If accesses are repeated while reorder_access is identical,
|
|
|
|
* never matches the new access, because !(type & KCSAN_ACCESS_SCOPED).
|
|
|
|
*/
|
|
|
|
return reorder_access->ptr == ptr && reorder_access->size == size &&
|
|
|
|
reorder_access->type == type && reorder_access->ip == ip;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void
|
|
|
|
set_reorder_access(struct kcsan_ctx *ctx, const volatile void *ptr, size_t size,
|
|
|
|
int type, unsigned long ip)
|
|
|
|
{
|
|
|
|
struct kcsan_scoped_access *reorder_access = get_reorder_access(ctx);
|
|
|
|
|
|
|
|
if (!reorder_access || !kcsan_weak_memory)
|
|
|
|
return;
|
|
|
|
|
kcsan: Avoid nested contexts reading inconsistent reorder_access
Nested contexts, such as nested interrupts or scheduler code, share the
same kcsan_ctx. When such a nested context reads an inconsistent
reorder_access due to an interrupt during set_reorder_access(), we can
observe the following warning:
| ------------[ cut here ]------------
| Cannot find frame for torture_random kernel/torture.c:456 in stack trace
| WARNING: CPU: 13 PID: 147 at kernel/kcsan/report.c:343 replace_stack_entry kernel/kcsan/report.c:343
| ...
| Call Trace:
| <TASK>
| sanitize_stack_entries kernel/kcsan/report.c:351 [inline]
| print_report kernel/kcsan/report.c:409
| kcsan_report_known_origin kernel/kcsan/report.c:693
| kcsan_setup_watchpoint kernel/kcsan/core.c:658
| rcutorture_one_extend kernel/rcu/rcutorture.c:1475
| rcutorture_loop_extend kernel/rcu/rcutorture.c:1558 [inline]
| ...
| </TASK>
| ---[ end trace ee5299cb933115f5 ]---
| ==================================================================
| BUG: KCSAN: data-race in _raw_spin_lock_irqsave / rcutorture_one_extend
|
| write (reordered) to 0xffffffff8c93b300 of 8 bytes by task 154 on cpu 12:
| queued_spin_lock include/asm-generic/qspinlock.h:80 [inline]
| do_raw_spin_lock include/linux/spinlock.h:185 [inline]
| __raw_spin_lock_irqsave include/linux/spinlock_api_smp.h:111 [inline]
| _raw_spin_lock_irqsave kernel/locking/spinlock.c:162
| try_to_wake_up kernel/sched/core.c:4003
| sysvec_apic_timer_interrupt arch/x86/kernel/apic/apic.c:1097
| asm_sysvec_apic_timer_interrupt arch/x86/include/asm/idtentry.h:638
| set_reorder_access kernel/kcsan/core.c:416 [inline] <-- inconsistent reorder_access
| kcsan_setup_watchpoint kernel/kcsan/core.c:693
| rcutorture_one_extend kernel/rcu/rcutorture.c:1475
| rcutorture_loop_extend kernel/rcu/rcutorture.c:1558 [inline]
| rcu_torture_one_read kernel/rcu/rcutorture.c:1600
| rcu_torture_reader kernel/rcu/rcutorture.c:1692
| kthread kernel/kthread.c:327
| ret_from_fork arch/x86/entry/entry_64.S:295
|
| read to 0xffffffff8c93b300 of 8 bytes by task 147 on cpu 13:
| rcutorture_one_extend kernel/rcu/rcutorture.c:1475
| rcutorture_loop_extend kernel/rcu/rcutorture.c:1558 [inline]
| ...
The warning is telling us that there was a data race which KCSAN wants
to report, but the function where the original access (that is now
reordered) happened cannot be found in the stack trace, which prevents
KCSAN from generating the right stack trace. The stack trace of "write
(reordered)" now only shows where the access was reordered to, but
should instead show the stack trace of the original write, with a final
line saying "reordered to".
At the point where set_reorder_access() is interrupted, it just set
reorder_access->ptr and size, at which point size is non-zero. This is
sufficient (if ctx->disable_scoped is zero) for further accesses from
nested contexts to perform checking of this reorder_access.
That then happened in _raw_spin_lock_irqsave(), which is called by
scheduler code. However, since reorder_access->ip is still stale (ptr
and size belong to a different ip not yet set) this finally leads to
replace_stack_entry() not finding the frame in reorder_access->ip and
generating the above warning.
Fix it by ensuring that a nested context cannot access reorder_access
while we update it in set_reorder_access(): set ctx->disable_scoped for
the duration that reorder_access is updated, which effectively locks
reorder_access and prevents concurrent use by nested contexts. Note,
set_reorder_access() can do the update only if disabled_scoped is zero
on entry, and must therefore set disable_scoped back to non-zero after
the initial check in set_reorder_access().
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2021-12-06 07:41:50 +01:00
|
|
|
/*
|
|
|
|
* To avoid nested interrupts or scheduler (which share kcsan_ctx)
|
|
|
|
* reading an inconsistent reorder_access, ensure that the below has
|
|
|
|
* exclusive access to reorder_access by disallowing concurrent use.
|
|
|
|
*/
|
|
|
|
ctx->disable_scoped++;
|
|
|
|
barrier();
|
2021-08-05 14:57:45 +02:00
|
|
|
reorder_access->ptr = ptr;
|
|
|
|
reorder_access->size = size;
|
|
|
|
reorder_access->type = type | KCSAN_ACCESS_SCOPED;
|
|
|
|
reorder_access->ip = ip;
|
|
|
|
reorder_access->stack_depth = get_kcsan_stack_depth();
|
kcsan: Avoid nested contexts reading inconsistent reorder_access
Nested contexts, such as nested interrupts or scheduler code, share the
same kcsan_ctx. When such a nested context reads an inconsistent
reorder_access due to an interrupt during set_reorder_access(), we can
observe the following warning:
| ------------[ cut here ]------------
| Cannot find frame for torture_random kernel/torture.c:456 in stack trace
| WARNING: CPU: 13 PID: 147 at kernel/kcsan/report.c:343 replace_stack_entry kernel/kcsan/report.c:343
| ...
| Call Trace:
| <TASK>
| sanitize_stack_entries kernel/kcsan/report.c:351 [inline]
| print_report kernel/kcsan/report.c:409
| kcsan_report_known_origin kernel/kcsan/report.c:693
| kcsan_setup_watchpoint kernel/kcsan/core.c:658
| rcutorture_one_extend kernel/rcu/rcutorture.c:1475
| rcutorture_loop_extend kernel/rcu/rcutorture.c:1558 [inline]
| ...
| </TASK>
| ---[ end trace ee5299cb933115f5 ]---
| ==================================================================
| BUG: KCSAN: data-race in _raw_spin_lock_irqsave / rcutorture_one_extend
|
| write (reordered) to 0xffffffff8c93b300 of 8 bytes by task 154 on cpu 12:
| queued_spin_lock include/asm-generic/qspinlock.h:80 [inline]
| do_raw_spin_lock include/linux/spinlock.h:185 [inline]
| __raw_spin_lock_irqsave include/linux/spinlock_api_smp.h:111 [inline]
| _raw_spin_lock_irqsave kernel/locking/spinlock.c:162
| try_to_wake_up kernel/sched/core.c:4003
| sysvec_apic_timer_interrupt arch/x86/kernel/apic/apic.c:1097
| asm_sysvec_apic_timer_interrupt arch/x86/include/asm/idtentry.h:638
| set_reorder_access kernel/kcsan/core.c:416 [inline] <-- inconsistent reorder_access
| kcsan_setup_watchpoint kernel/kcsan/core.c:693
| rcutorture_one_extend kernel/rcu/rcutorture.c:1475
| rcutorture_loop_extend kernel/rcu/rcutorture.c:1558 [inline]
| rcu_torture_one_read kernel/rcu/rcutorture.c:1600
| rcu_torture_reader kernel/rcu/rcutorture.c:1692
| kthread kernel/kthread.c:327
| ret_from_fork arch/x86/entry/entry_64.S:295
|
| read to 0xffffffff8c93b300 of 8 bytes by task 147 on cpu 13:
| rcutorture_one_extend kernel/rcu/rcutorture.c:1475
| rcutorture_loop_extend kernel/rcu/rcutorture.c:1558 [inline]
| ...
The warning is telling us that there was a data race which KCSAN wants
to report, but the function where the original access (that is now
reordered) happened cannot be found in the stack trace, which prevents
KCSAN from generating the right stack trace. The stack trace of "write
(reordered)" now only shows where the access was reordered to, but
should instead show the stack trace of the original write, with a final
line saying "reordered to".
At the point where set_reorder_access() is interrupted, it just set
reorder_access->ptr and size, at which point size is non-zero. This is
sufficient (if ctx->disable_scoped is zero) for further accesses from
nested contexts to perform checking of this reorder_access.
That then happened in _raw_spin_lock_irqsave(), which is called by
scheduler code. However, since reorder_access->ip is still stale (ptr
and size belong to a different ip not yet set) this finally leads to
replace_stack_entry() not finding the frame in reorder_access->ip and
generating the above warning.
Fix it by ensuring that a nested context cannot access reorder_access
while we update it in set_reorder_access(): set ctx->disable_scoped for
the duration that reorder_access is updated, which effectively locks
reorder_access and prevents concurrent use by nested contexts. Note,
set_reorder_access() can do the update only if disabled_scoped is zero
on entry, and must therefore set disable_scoped back to non-zero after
the initial check in set_reorder_access().
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2021-12-06 07:41:50 +01:00
|
|
|
barrier();
|
|
|
|
ctx->disable_scoped--;
|
2021-08-05 14:57:45 +02:00
|
|
|
}
|
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
/*
|
|
|
|
* Pull everything together: check_access() below contains the performance
|
|
|
|
* critical operations; the fast-path (including check_access) functions should
|
|
|
|
* all be inlinable by the instrumentation functions.
|
|
|
|
*
|
|
|
|
* The slow-path (kcsan_found_watchpoint, kcsan_setup_watchpoint) are
|
|
|
|
* non-inlinable -- note that, we prefix these with "kcsan_" to ensure they can
|
|
|
|
* be filtered from the stacktrace, as well as give them unique names for the
|
|
|
|
* UACCESS whitelist of objtool. Each function uses user_access_save/restore(),
|
|
|
|
* since they do not access any user memory, but instrumentation is still
|
|
|
|
* emitted in UACCESS regions.
|
|
|
|
*/
|
|
|
|
|
|
|
|
static noinline void kcsan_found_watchpoint(const volatile void *ptr,
|
2019-11-20 10:41:43 +01:00
|
|
|
size_t size,
|
2020-01-10 19:48:33 +01:00
|
|
|
int type,
|
2021-08-09 13:25:12 +02:00
|
|
|
unsigned long ip,
|
2019-11-14 19:02:54 +01:00
|
|
|
atomic_long_t *watchpoint,
|
|
|
|
long encoded_watchpoint)
|
|
|
|
{
|
2021-06-07 14:56:51 +02:00
|
|
|
const bool is_assert = (type & KCSAN_ACCESS_ASSERT) != 0;
|
2021-06-07 14:56:50 +02:00
|
|
|
struct kcsan_ctx *ctx = get_ctx();
|
2019-11-14 19:02:54 +01:00
|
|
|
unsigned long flags;
|
|
|
|
bool consumed;
|
|
|
|
|
2021-06-07 14:56:50 +02:00
|
|
|
/*
|
|
|
|
* We know a watchpoint exists. Let's try to keep the race-window
|
|
|
|
* between here and finally consuming the watchpoint below as small as
|
|
|
|
* possible -- avoid unneccessarily complex code until consumed.
|
|
|
|
*/
|
|
|
|
|
|
|
|
if (!kcsan_is_enabled(ctx))
|
2019-11-14 19:02:54 +01:00
|
|
|
return;
|
2020-02-11 17:04:22 +01:00
|
|
|
|
|
|
|
/*
|
|
|
|
* The access_mask check relies on value-change comparison. To avoid
|
|
|
|
* reporting a race where e.g. the writer set up the watchpoint, but the
|
|
|
|
* reader has access_mask!=0, we have to ignore the found watchpoint.
|
2021-08-05 14:57:45 +02:00
|
|
|
*
|
|
|
|
* reorder_access is never created from an access with access_mask set.
|
2020-02-11 17:04:22 +01:00
|
|
|
*/
|
2021-08-05 14:57:45 +02:00
|
|
|
if (ctx->access_mask && !find_reorder_access(ctx, ptr, size, type, ip))
|
2020-02-11 17:04:22 +01:00
|
|
|
return;
|
|
|
|
|
2021-06-07 14:56:51 +02:00
|
|
|
/*
|
|
|
|
* If the other thread does not want to ignore the access, and there was
|
|
|
|
* a value change as a result of this thread's operation, we will still
|
|
|
|
* generate a report of unknown origin.
|
|
|
|
*
|
|
|
|
* Use CONFIG_KCSAN_REPORT_RACE_UNKNOWN_ORIGIN=n to filter.
|
|
|
|
*/
|
|
|
|
if (!is_assert && kcsan_ignore_address(ptr))
|
|
|
|
return;
|
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
/*
|
2021-06-07 14:56:50 +02:00
|
|
|
* Consuming the watchpoint must be guarded by kcsan_is_enabled() to
|
|
|
|
* avoid erroneously triggering reports if the context is disabled.
|
2019-11-14 19:02:54 +01:00
|
|
|
*/
|
|
|
|
consumed = try_consume_watchpoint(watchpoint, encoded_watchpoint);
|
|
|
|
|
|
|
|
/* keep this after try_consume_watchpoint */
|
|
|
|
flags = user_access_save();
|
|
|
|
|
|
|
|
if (consumed) {
|
2020-07-29 13:09:16 +02:00
|
|
|
kcsan_save_irqtrace(current);
|
2021-08-09 13:25:12 +02:00
|
|
|
kcsan_report_set_info(ptr, size, type, ip, watchpoint - watchpoints);
|
2020-07-29 13:09:16 +02:00
|
|
|
kcsan_restore_irqtrace(current);
|
2019-11-14 19:02:54 +01:00
|
|
|
} else {
|
|
|
|
/*
|
|
|
|
* The other thread may not print any diagnostics, as it has
|
|
|
|
* already removed the watchpoint, or another thread consumed
|
|
|
|
* the watchpoint before this thread.
|
|
|
|
*/
|
2020-08-10 10:06:25 +02:00
|
|
|
atomic_long_inc(&kcsan_counters[KCSAN_COUNTER_REPORT_RACES]);
|
2019-11-14 19:02:54 +01:00
|
|
|
}
|
kcsan: Introduce KCSAN_ACCESS_ASSERT access type
The KCSAN_ACCESS_ASSERT access type may be used to introduce dummy reads
and writes to assert certain properties of concurrent code, where bugs
could not be detected as normal data races.
For example, a variable that is only meant to be written by a single
CPU, but may be read (without locking) by other CPUs must still be
marked properly to avoid data races. However, concurrent writes,
regardless if WRITE_ONCE() or not, would be a bug. Using
kcsan_check_access(&x, sizeof(x), KCSAN_ACCESS_ASSERT) would allow
catching such bugs.
To support KCSAN_ACCESS_ASSERT the following notable changes were made:
* If an access is of type KCSAN_ASSERT_ACCESS, disable various filters
that only apply to data races, so that all races that KCSAN observes are
reported.
* Bug reports that involve an ASSERT access type will be reported as
"KCSAN: assert: race in ..." instead of "data-race"; this will help
more easily distinguish them.
* Update a few comments to just mention 'races' where we do not always
mean pure data races.
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2020-02-06 16:46:24 +01:00
|
|
|
|
2021-06-07 14:56:51 +02:00
|
|
|
if (is_assert)
|
2020-08-10 10:06:25 +02:00
|
|
|
atomic_long_inc(&kcsan_counters[KCSAN_COUNTER_ASSERT_FAILURES]);
|
kcsan: Introduce KCSAN_ACCESS_ASSERT access type
The KCSAN_ACCESS_ASSERT access type may be used to introduce dummy reads
and writes to assert certain properties of concurrent code, where bugs
could not be detected as normal data races.
For example, a variable that is only meant to be written by a single
CPU, but may be read (without locking) by other CPUs must still be
marked properly to avoid data races. However, concurrent writes,
regardless if WRITE_ONCE() or not, would be a bug. Using
kcsan_check_access(&x, sizeof(x), KCSAN_ACCESS_ASSERT) would allow
catching such bugs.
To support KCSAN_ACCESS_ASSERT the following notable changes were made:
* If an access is of type KCSAN_ASSERT_ACCESS, disable various filters
that only apply to data races, so that all races that KCSAN observes are
reported.
* Bug reports that involve an ASSERT access type will be reported as
"KCSAN: assert: race in ..." instead of "data-race"; this will help
more easily distinguish them.
* Update a few comments to just mention 'races' where we do not always
mean pure data races.
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2020-02-06 16:46:24 +01:00
|
|
|
else
|
2020-08-10 10:06:25 +02:00
|
|
|
atomic_long_inc(&kcsan_counters[KCSAN_COUNTER_DATA_RACES]);
|
2019-11-14 19:02:54 +01:00
|
|
|
|
|
|
|
user_access_restore(flags);
|
|
|
|
}
|
|
|
|
|
2019-11-20 10:41:43 +01:00
|
|
|
static noinline void
|
2021-08-09 13:25:12 +02:00
|
|
|
kcsan_setup_watchpoint(const volatile void *ptr, size_t size, int type, unsigned long ip)
|
2019-11-14 19:02:54 +01:00
|
|
|
{
|
2020-01-10 19:48:33 +01:00
|
|
|
const bool is_write = (type & KCSAN_ACCESS_WRITE) != 0;
|
kcsan: Introduce KCSAN_ACCESS_ASSERT access type
The KCSAN_ACCESS_ASSERT access type may be used to introduce dummy reads
and writes to assert certain properties of concurrent code, where bugs
could not be detected as normal data races.
For example, a variable that is only meant to be written by a single
CPU, but may be read (without locking) by other CPUs must still be
marked properly to avoid data races. However, concurrent writes,
regardless if WRITE_ONCE() or not, would be a bug. Using
kcsan_check_access(&x, sizeof(x), KCSAN_ACCESS_ASSERT) would allow
catching such bugs.
To support KCSAN_ACCESS_ASSERT the following notable changes were made:
* If an access is of type KCSAN_ACCESS_ASSERT, disable various filters
that only apply to data races, so that all races that KCSAN observes are
reported.
* Bug reports that involve an ASSERT access type will be reported as
"KCSAN: assert: race in ..." instead of "data-race"; this will help
more easily distinguish them.
* Update a few comments to just mention 'races' where we do not always
mean pure data races.
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2020-02-06 16:46:24 +01:00
|
|
|
const bool is_assert = (type & KCSAN_ACCESS_ASSERT) != 0;
|
2019-11-14 19:02:54 +01:00
|
|
|
atomic_long_t *watchpoint;
|
2021-04-14 13:28:17 +02:00
|
|
|
u64 old, new, diff;
|
2020-02-11 17:04:21 +01:00
|
|
|
enum kcsan_value_change value_change = KCSAN_VALUE_CHANGE_MAYBE;
|
2021-08-05 14:57:45 +02:00
|
|
|
bool interrupt_watcher = kcsan_interrupt_watcher;
|
2019-11-14 19:02:54 +01:00
|
|
|
unsigned long ua_flags = user_access_save();
|
2021-06-07 14:56:50 +02:00
|
|
|
struct kcsan_ctx *ctx = get_ctx();
|
2021-08-05 14:57:45 +02:00
|
|
|
unsigned long access_mask = ctx->access_mask;
|
2020-02-21 23:02:09 +01:00
|
|
|
unsigned long irq_flags = 0;
|
2021-08-05 14:57:45 +02:00
|
|
|
bool is_reorder_access;
|
2019-11-14 19:02:54 +01:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Always reset kcsan_skip counter in slow-path to avoid underflow; see
|
|
|
|
* should_watch().
|
|
|
|
*/
|
|
|
|
reset_kcsan_skip();
|
|
|
|
|
2021-06-07 14:56:50 +02:00
|
|
|
if (!kcsan_is_enabled(ctx))
|
2019-11-14 19:02:54 +01:00
|
|
|
goto out;
|
|
|
|
|
2020-02-25 15:32:58 +01:00
|
|
|
/*
|
2021-06-07 14:56:51 +02:00
|
|
|
* Check to-ignore addresses after kcsan_is_enabled(), as we may access
|
|
|
|
* memory that is not yet initialized during early boot.
|
2020-02-25 15:32:58 +01:00
|
|
|
*/
|
2021-06-07 14:56:51 +02:00
|
|
|
if (!is_assert && kcsan_ignore_address(ptr))
|
2020-02-25 15:32:58 +01:00
|
|
|
goto out;
|
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
if (!check_encodable((unsigned long)ptr, size)) {
|
2020-08-10 10:06:25 +02:00
|
|
|
atomic_long_inc(&kcsan_counters[KCSAN_COUNTER_UNENCODABLE_ACCESSES]);
|
2019-11-14 19:02:54 +01:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
2021-08-05 14:57:45 +02:00
|
|
|
/*
|
|
|
|
* The local CPU cannot observe reordering of its own accesses, and
|
|
|
|
* therefore we need to take care of 2 cases to avoid false positives:
|
|
|
|
*
|
|
|
|
* 1. Races of the reordered access with interrupts. To avoid, if
|
|
|
|
* the current access is reorder_access, disable interrupts.
|
|
|
|
* 2. Avoid races of scoped accesses from nested interrupts (below).
|
|
|
|
*/
|
|
|
|
is_reorder_access = find_reorder_access(ctx, ptr, size, type, ip);
|
|
|
|
if (is_reorder_access)
|
|
|
|
interrupt_watcher = false;
|
2021-11-30 12:44:11 +01:00
|
|
|
/*
|
|
|
|
* Avoid races of scoped accesses from nested interrupts (or scheduler).
|
|
|
|
* Assume setting up a watchpoint for a non-scoped (normal) access that
|
|
|
|
* also conflicts with a current scoped access. In a nested interrupt,
|
|
|
|
* which shares the context, it would check a conflicting scoped access.
|
|
|
|
* To avoid, disable scoped access checking.
|
|
|
|
*/
|
|
|
|
ctx->disable_scoped++;
|
|
|
|
|
2020-07-29 13:09:16 +02:00
|
|
|
/*
|
|
|
|
* Save and restore the IRQ state trace touched by KCSAN, since KCSAN's
|
|
|
|
* runtime is entered for every memory access, and potentially useful
|
|
|
|
* information is lost if dirtied by KCSAN.
|
|
|
|
*/
|
|
|
|
kcsan_save_irqtrace(current);
|
2021-08-05 14:57:45 +02:00
|
|
|
if (!interrupt_watcher)
|
2020-06-24 13:32:46 +02:00
|
|
|
local_irq_save(irq_flags);
|
2019-11-14 19:02:54 +01:00
|
|
|
|
|
|
|
watchpoint = insert_watchpoint((unsigned long)ptr, size, is_write);
|
|
|
|
if (watchpoint == NULL) {
|
|
|
|
/*
|
2019-11-20 10:41:43 +01:00
|
|
|
* Out of capacity: the size of 'watchpoints', and the frequency
|
|
|
|
* with which should_watch() returns true should be tweaked so
|
2019-11-14 19:02:54 +01:00
|
|
|
* that this case happens very rarely.
|
|
|
|
*/
|
2020-08-10 10:06:25 +02:00
|
|
|
atomic_long_inc(&kcsan_counters[KCSAN_COUNTER_NO_CAPACITY]);
|
2019-11-14 19:02:54 +01:00
|
|
|
goto out_unlock;
|
|
|
|
}
|
|
|
|
|
2020-08-10 10:06:25 +02:00
|
|
|
atomic_long_inc(&kcsan_counters[KCSAN_COUNTER_SETUP_WATCHPOINTS]);
|
|
|
|
atomic_long_inc(&kcsan_counters[KCSAN_COUNTER_USED_WATCHPOINTS]);
|
2019-11-14 19:02:54 +01:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Read the current value, to later check and infer a race if the data
|
|
|
|
* was modified via a non-instrumented access, e.g. from a device.
|
|
|
|
*/
|
2021-08-05 14:57:45 +02:00
|
|
|
old = is_reorder_access ? 0 : read_instrumented_memory(ptr, size);
|
2019-11-14 19:02:54 +01:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Delay this thread, to increase probability of observing a racy
|
|
|
|
* conflicting access.
|
|
|
|
*/
|
2020-08-21 14:31:26 +02:00
|
|
|
delay_access(type);
|
2019-11-14 19:02:54 +01:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Re-read value, and check if it is as expected; if not, we infer a
|
|
|
|
* racy access.
|
|
|
|
*/
|
2021-08-05 14:57:45 +02:00
|
|
|
if (!is_reorder_access) {
|
|
|
|
new = read_instrumented_memory(ptr, size);
|
|
|
|
} else {
|
|
|
|
/*
|
|
|
|
* Reordered accesses cannot be used for value change detection,
|
|
|
|
* because the memory location may no longer be accessible and
|
|
|
|
* could result in a fault.
|
|
|
|
*/
|
|
|
|
new = 0;
|
|
|
|
access_mask = 0;
|
|
|
|
}
|
2019-11-14 19:02:54 +01:00
|
|
|
|
2021-04-14 13:28:17 +02:00
|
|
|
diff = old ^ new;
|
|
|
|
if (access_mask)
|
|
|
|
diff &= access_mask;
|
|
|
|
|
2021-06-07 14:56:51 +02:00
|
|
|
/*
|
|
|
|
* Check if we observed a value change.
|
|
|
|
*
|
|
|
|
* Also check if the data race should be ignored (the rules depend on
|
|
|
|
* non-zero diff); if it is to be ignored, the below rules for
|
|
|
|
* KCSAN_VALUE_CHANGE_MAYBE apply.
|
|
|
|
*/
|
|
|
|
if (diff && !kcsan_ignore_data_race(size, type, old, new, diff))
|
2020-02-11 17:04:21 +01:00
|
|
|
value_change = KCSAN_VALUE_CHANGE_TRUE;
|
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
/* Check if this access raced with another. */
|
kcsan: Avoid blocking producers in prepare_report()
To avoid deadlock in case watchers can be interrupted, we need to ensure
that producers of the struct other_info can never be blocked by an
unrelated consumer. (Likely to occur with KCSAN_INTERRUPT_WATCHER.)
There are several cases that can lead to this scenario, for example:
1. A watchpoint A was set up by task T1, but interrupted by
interrupt I1. Some other thread (task or interrupt) finds
watchpoint A consumes it, and sets other_info. Then I1 also
finds some unrelated watchpoint B, consumes it, but is blocked
because other_info is in use. T1 cannot consume other_info
because I1 never returns -> deadlock.
2. A watchpoint A was set up by task T1, but interrupted by
interrupt I1, which also sets up a watchpoint B. Some other
thread finds watchpoint A, and consumes it and sets up
other_info with its information. Similarly some other thread
finds watchpoint B and consumes it, but is then blocked because
other_info is in use. When I1 continues it sees its watchpoint
was consumed, and that it must wait for other_info, which
currently contains information to be consumed by T1. However, T1
cannot unblock other_info because I1 never returns -> deadlock.
To avoid this, we need to ensure that producers of struct other_info
always have a usable other_info entry. This is obviously not the case
with only a single instance of struct other_info, as concurrent
producers must wait for the entry to be released by some consumer (which
may be locked up as illustrated above).
While it would be nice if producers could simply call kmalloc() and
append their instance of struct other_info to a list, we are very
limited in this code path: since KCSAN can instrument the allocators
themselves, calling kmalloc() could lead to deadlock or corrupted
allocator state.
Since producers of the struct other_info will always succeed at
try_consume_watchpoint(), preceding the call into kcsan_report(), we
know that the particular watchpoint slot cannot simply be reused or
consumed by another potential other_info producer. If we move removal of
a watchpoint after reporting (by the consumer of struct other_info), we
can see a consumed watchpoint as a held lock on elements of other_info,
if we create a one-to-one mapping of a watchpoint to an other_info
element.
Therefore, the simplest solution is to create an array of struct
other_info that is as large as the watchpoints array in core.c, and pass
the watchpoint index to kcsan_report() for producers and consumers, and
change watchpoints to be removed after reporting is done.
With a default config on a 64-bit system, the array other_infos consumes
~37KiB. For most systems today this is not a problem. On smaller memory
constrained systems, the config value CONFIG_KCSAN_NUM_WATCHPOINTS can
be reduced appropriately.
Overall, this change is a simplification of the prepare_report() code,
and makes some of the checks (such as checking if at least one access is
a write) redundant.
Tested:
$ tools/testing/selftests/rcutorture/bin/kvm.sh \
--cpus 12 --duration 10 --kconfig "CONFIG_DEBUG_INFO=y \
CONFIG_KCSAN=y CONFIG_KCSAN_ASSUME_PLAIN_WRITES_ATOMIC=n \
CONFIG_KCSAN_REPORT_VALUE_CHANGE_ONLY=n \
CONFIG_KCSAN_REPORT_ONCE_IN_MS=100000 CONFIG_KCSAN_VERBOSE=y \
CONFIG_KCSAN_INTERRUPT_WATCHER=y CONFIG_PROVE_LOCKING=y" \
--configs TREE03
=> No longer hangs and runs to completion as expected.
Reported-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-18 18:38:45 +01:00
|
|
|
if (!consume_watchpoint(watchpoint)) {
|
2020-02-11 17:04:21 +01:00
|
|
|
/*
|
|
|
|
* Depending on the access type, map a value_change of MAYBE to
|
2020-02-11 17:04:22 +01:00
|
|
|
* TRUE (always report) or FALSE (never report).
|
2020-02-11 17:04:21 +01:00
|
|
|
*/
|
2020-02-11 17:04:22 +01:00
|
|
|
if (value_change == KCSAN_VALUE_CHANGE_MAYBE) {
|
|
|
|
if (access_mask != 0) {
|
|
|
|
/*
|
|
|
|
* For access with access_mask, we require a
|
|
|
|
* value-change, as it is likely that races on
|
|
|
|
* ~access_mask bits are expected.
|
|
|
|
*/
|
|
|
|
value_change = KCSAN_VALUE_CHANGE_FALSE;
|
|
|
|
} else if (size > 8 || is_assert) {
|
|
|
|
/* Always assume a value-change. */
|
|
|
|
value_change = KCSAN_VALUE_CHANGE_TRUE;
|
|
|
|
}
|
2020-02-11 17:04:21 +01:00
|
|
|
}
|
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
/*
|
|
|
|
* No need to increment 'data_races' counter, as the racing
|
|
|
|
* thread already did.
|
kcsan: Introduce KCSAN_ACCESS_ASSERT access type
The KCSAN_ACCESS_ASSERT access type may be used to introduce dummy reads
and writes to assert certain properties of concurrent code, where bugs
could not be detected as normal data races.
For example, a variable that is only meant to be written by a single
CPU, but may be read (without locking) by other CPUs must still be
marked properly to avoid data races. However, concurrent writes,
regardless if WRITE_ONCE() or not, would be a bug. Using
kcsan_check_access(&x, sizeof(x), KCSAN_ACCESS_ASSERT) would allow
catching such bugs.
To support KCSAN_ACCESS_ASSERT the following notable changes were made:
* If an access is of type KCSAN_ACCESS_ASSERT, disable various filters
that only apply to data races, so that all races that KCSAN observes are
reported.
* Bug reports that involve an ASSERT access type will be reported as
"KCSAN: assert: race in ..." instead of "data-race"; this will help
more easily distinguish them.
* Update a few comments to just mention 'races' where we do not always
mean pure data races.
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2020-02-06 16:46:24 +01:00
|
|
|
*
|
|
|
|
* Count 'assert_failures' for each failed ASSERT access,
|
|
|
|
* therefore both this thread and the racing thread may
|
|
|
|
* increment this counter.
|
2019-11-14 19:02:54 +01:00
|
|
|
*/
|
2020-02-11 17:04:21 +01:00
|
|
|
if (is_assert && value_change == KCSAN_VALUE_CHANGE_TRUE)
|
2020-08-10 10:06:25 +02:00
|
|
|
atomic_long_inc(&kcsan_counters[KCSAN_COUNTER_ASSERT_FAILURES]);
|
kcsan: Introduce KCSAN_ACCESS_ASSERT access type
The KCSAN_ACCESS_ASSERT access type may be used to introduce dummy reads
and writes to assert certain properties of concurrent code, where bugs
could not be detected as normal data races.
For example, a variable that is only meant to be written by a single
CPU, but may be read (without locking) by other CPUs must still be
marked properly to avoid data races. However, concurrent writes,
regardless if WRITE_ONCE() or not, would be a bug. Using
kcsan_check_access(&x, sizeof(x), KCSAN_ACCESS_ASSERT) would allow
catching such bugs.
To support KCSAN_ACCESS_ASSERT the following notable changes were made:
* If an access is of type KCSAN_ACCESS_ASSERT, disable various filters
that only apply to data races, so that all races that KCSAN observes are
reported.
* Bug reports that involve an ASSERT access type will be reported as
"KCSAN: assert: race in ..." instead of "data-race"; this will help
more easily distinguish them.
* Update a few comments to just mention 'races' where we do not always
mean pure data races.
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2020-02-06 16:46:24 +01:00
|
|
|
|
2021-08-09 13:25:12 +02:00
|
|
|
kcsan_report_known_origin(ptr, size, type, ip,
|
|
|
|
value_change, watchpoint - watchpoints,
|
kcsan: Report observed value changes
When a thread detects that a memory location was modified without its
watchpoint being hit, the report notes that a change was detected, but
does not provide concrete values for the change. Knowing the concrete
values can be very helpful in tracking down any racy writers (e.g. as
specific values may only be written in some portions of code, or under
certain conditions).
When we detect a modification, let's report the concrete old/new values,
along with the access's mask of relevant bits (and which relevant bits
were modified). This can make it easier to identify potential racy
writers. As the snapshots are at most 8 bytes, we can only report values
for accesses up to this size, but this appears to cater for the common
case.
When we detect a race via a watchpoint, we may or may not have concrete
values for the modification. To be helpful, let's attempt to log them
when we do as they can be ignored where irrelevant.
The resulting reports appear as follows, with values zero-padded to the
access width:
| ==================================================================
| BUG: KCSAN: data-race in el0_svc_common+0x34/0x25c arch/arm64/kernel/syscall.c:96
|
| race at unknown origin, with read to 0xffff00007ae6aa00 of 8 bytes by task 223 on cpu 1:
| el0_svc_common+0x34/0x25c arch/arm64/kernel/syscall.c:96
| do_el0_svc+0x48/0xec arch/arm64/kernel/syscall.c:178
| el0_svc arch/arm64/kernel/entry-common.c:226 [inline]
| el0_sync_handler+0x1a4/0x390 arch/arm64/kernel/entry-common.c:236
| el0_sync+0x140/0x180 arch/arm64/kernel/entry.S:674
|
| value changed: 0x0000000000000000 -> 0x0000000000000002
|
| Reported by Kernel Concurrency Sanitizer on:
| CPU: 1 PID: 223 Comm: syz-executor.1 Not tainted 5.8.0-rc3-00094-ga73f923ecc8e-dirty #3
| Hardware name: linux,dummy-virt (DT)
| ==================================================================
If an access mask is set, it is shown underneath the "value changed"
line as "bits changed: 0x<bits changed> with mask 0x<non-zero mask>".
Signed-off-by: Mark Rutland <mark.rutland@arm.com>
[ elver@google.com: align "value changed" and "bits changed" lines,
which required massaging the message; do not print bits+mask if no
mask set. ]
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2021-04-14 13:28:24 +02:00
|
|
|
old, new, access_mask);
|
2020-02-11 17:04:21 +01:00
|
|
|
} else if (value_change == KCSAN_VALUE_CHANGE_TRUE) {
|
2019-11-14 19:02:54 +01:00
|
|
|
/* Inferring a race, since the value should not have changed. */
|
kcsan: Introduce KCSAN_ACCESS_ASSERT access type
The KCSAN_ACCESS_ASSERT access type may be used to introduce dummy reads
and writes to assert certain properties of concurrent code, where bugs
could not be detected as normal data races.
For example, a variable that is only meant to be written by a single
CPU, but may be read (without locking) by other CPUs must still be
marked properly to avoid data races. However, concurrent writes,
regardless if WRITE_ONCE() or not, would be a bug. Using
kcsan_check_access(&x, sizeof(x), KCSAN_ACCESS_ASSERT) would allow
catching such bugs.
To support KCSAN_ACCESS_ASSERT the following notable changes were made:
* If an access is of type KCSAN_ACCESS_ASSERT, disable various filters
that only apply to data races, so that all races that KCSAN observes are
reported.
* Bug reports that involve an ASSERT access type will be reported as
"KCSAN: assert: race in ..." instead of "data-race"; this will help
more easily distinguish them.
* Update a few comments to just mention 'races' where we do not always
mean pure data races.
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2020-02-06 16:46:24 +01:00
|
|
|
|
2020-08-10 10:06:25 +02:00
|
|
|
atomic_long_inc(&kcsan_counters[KCSAN_COUNTER_RACES_UNKNOWN_ORIGIN]);
|
kcsan: Introduce KCSAN_ACCESS_ASSERT access type
The KCSAN_ACCESS_ASSERT access type may be used to introduce dummy reads
and writes to assert certain properties of concurrent code, where bugs
could not be detected as normal data races.
For example, a variable that is only meant to be written by a single
CPU, but may be read (without locking) by other CPUs must still be
marked properly to avoid data races. However, concurrent writes,
regardless if WRITE_ONCE() or not, would be a bug. Using
kcsan_check_access(&x, sizeof(x), KCSAN_ACCESS_ASSERT) would allow
catching such bugs.
To support KCSAN_ACCESS_ASSERT the following notable changes were made:
* If an access is of type KCSAN_ACCESS_ASSERT, disable various filters
that only apply to data races, so that all races that KCSAN observes are
reported.
* Bug reports that involve an ASSERT access type will be reported as
"KCSAN: assert: race in ..." instead of "data-race"; this will help
more easily distinguish them.
* Update a few comments to just mention 'races' where we do not always
mean pure data races.
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2020-02-06 16:46:24 +01:00
|
|
|
if (is_assert)
|
2020-08-10 10:06:25 +02:00
|
|
|
atomic_long_inc(&kcsan_counters[KCSAN_COUNTER_ASSERT_FAILURES]);
|
kcsan: Introduce KCSAN_ACCESS_ASSERT access type
The KCSAN_ACCESS_ASSERT access type may be used to introduce dummy reads
and writes to assert certain properties of concurrent code, where bugs
could not be detected as normal data races.
For example, a variable that is only meant to be written by a single
CPU, but may be read (without locking) by other CPUs must still be
marked properly to avoid data races. However, concurrent writes,
regardless if WRITE_ONCE() or not, would be a bug. Using
kcsan_check_access(&x, sizeof(x), KCSAN_ACCESS_ASSERT) would allow
catching such bugs.
To support KCSAN_ACCESS_ASSERT the following notable changes were made:
* If an access is of type KCSAN_ACCESS_ASSERT, disable various filters
that only apply to data races, so that all races that KCSAN observes are
reported.
* Bug reports that involve an ASSERT access type will be reported as
"KCSAN: assert: race in ..." instead of "data-race"; this will help
more easily distinguish them.
* Update a few comments to just mention 'races' where we do not always
mean pure data races.
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2020-02-06 16:46:24 +01:00
|
|
|
|
2021-08-09 13:25:12 +02:00
|
|
|
if (IS_ENABLED(CONFIG_KCSAN_REPORT_RACE_UNKNOWN_ORIGIN) || is_assert) {
|
|
|
|
kcsan_report_unknown_origin(ptr, size, type, ip,
|
|
|
|
old, new, access_mask);
|
|
|
|
}
|
2019-11-14 19:02:54 +01:00
|
|
|
}
|
|
|
|
|
kcsan: Avoid blocking producers in prepare_report()
To avoid deadlock in case watchers can be interrupted, we need to ensure
that producers of the struct other_info can never be blocked by an
unrelated consumer. (Likely to occur with KCSAN_INTERRUPT_WATCHER.)
There are several cases that can lead to this scenario, for example:
1. A watchpoint A was set up by task T1, but interrupted by
interrupt I1. Some other thread (task or interrupt) finds
watchpoint A, consumes it, and sets other_info. Then I1 also
finds some unrelated watchpoint B, consumes it, but is blocked
because other_info is in use. T1 cannot consume other_info
because I1 never returns -> deadlock.
2. A watchpoint A was set up by task T1, but interrupted by
interrupt I1, which also sets up a watchpoint B. Some other
thread finds watchpoint A, and consumes it and sets up
other_info with its information. Similarly some other thread
finds watchpoint B and consumes it, but is then blocked because
other_info is in use. When I1 continues it sees its watchpoint
was consumed, and that it must wait for other_info, which
currently contains information to be consumed by T1. However, T1
cannot unblock other_info because I1 never returns -> deadlock.
To avoid this, we need to ensure that producers of struct other_info
always have a usable other_info entry. This is obviously not the case
with only a single instance of struct other_info, as concurrent
producers must wait for the entry to be released by some consumer (which
may be locked up as illustrated above).
While it would be nice if producers could simply call kmalloc() and
append their instance of struct other_info to a list, we are very
limited in this code path: since KCSAN can instrument the allocators
themselves, calling kmalloc() could lead to deadlock or corrupted
allocator state.
Since producers of the struct other_info will always succeed at
try_consume_watchpoint(), preceding the call into kcsan_report(), we
know that the particular watchpoint slot cannot simply be reused or
consumed by another potential other_info producer. If we move removal of
a watchpoint after reporting (by the consumer of struct other_info), we
can see a consumed watchpoint as a held lock on elements of other_info,
if we create a one-to-one mapping of a watchpoint to an other_info
element.
Therefore, the simplest solution is to create an array of struct
other_info that is as large as the watchpoints array in core.c, and pass
the watchpoint index to kcsan_report() for producers and consumers, and
change watchpoints to be removed after reporting is done.
With a default config on a 64-bit system, the array other_infos consumes
~37KiB. For most systems today this is not a problem. On smaller memory
constrained systems, the config value CONFIG_KCSAN_NUM_WATCHPOINTS can
be reduced appropriately.
Overall, this change is a simplification of the prepare_report() code,
and makes some of the checks (such as checking if at least one access is
a write) redundant.
Tested:
$ tools/testing/selftests/rcutorture/bin/kvm.sh \
--cpus 12 --duration 10 --kconfig "CONFIG_DEBUG_INFO=y \
CONFIG_KCSAN=y CONFIG_KCSAN_ASSUME_PLAIN_WRITES_ATOMIC=n \
CONFIG_KCSAN_REPORT_VALUE_CHANGE_ONLY=n \
CONFIG_KCSAN_REPORT_ONCE_IN_MS=100000 CONFIG_KCSAN_VERBOSE=y \
CONFIG_KCSAN_INTERRUPT_WATCHER=y CONFIG_PROVE_LOCKING=y" \
--configs TREE03
=> No longer hangs and runs to completion as expected.
Reported-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-18 18:38:45 +01:00
|
|
|
/*
|
|
|
|
* Remove watchpoint; must be after reporting, since the slot may be
|
|
|
|
* reused after this point.
|
|
|
|
*/
|
|
|
|
remove_watchpoint(watchpoint);
|
2020-08-10 10:06:25 +02:00
|
|
|
atomic_long_dec(&kcsan_counters[KCSAN_COUNTER_USED_WATCHPOINTS]);
|
2021-08-05 14:57:45 +02:00
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
out_unlock:
|
2021-08-05 14:57:45 +02:00
|
|
|
if (!interrupt_watcher)
|
2020-06-24 13:32:46 +02:00
|
|
|
local_irq_restore(irq_flags);
|
2020-07-29 13:09:16 +02:00
|
|
|
kcsan_restore_irqtrace(current);
|
2021-11-30 12:44:11 +01:00
|
|
|
ctx->disable_scoped--;
|
2021-08-05 14:57:45 +02:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Reordered accesses cannot be used for value change detection,
|
|
|
|
* therefore never consider for reordering if access_mask is set.
|
|
|
|
* ASSERT_EXCLUSIVE are not real accesses, ignore them as well.
|
|
|
|
*/
|
|
|
|
if (!access_mask && !is_assert)
|
|
|
|
set_reorder_access(ctx, ptr, size, type, ip);
|
2019-11-14 19:02:54 +01:00
|
|
|
out:
|
|
|
|
user_access_restore(ua_flags);
|
|
|
|
}
|
|
|
|
|
2021-08-09 13:25:12 +02:00
|
|
|
static __always_inline void
|
|
|
|
check_access(const volatile void *ptr, size_t size, int type, unsigned long ip)
|
2019-11-14 19:02:54 +01:00
|
|
|
{
|
|
|
|
atomic_long_t *watchpoint;
|
|
|
|
long encoded_watchpoint;
|
|
|
|
|
2020-02-05 11:14:19 +01:00
|
|
|
/*
|
|
|
|
* Do nothing for 0 sized check; this comparison will be optimized out
|
|
|
|
* for constant sized instrumentation (__tsan_{read,write}N).
|
|
|
|
*/
|
|
|
|
if (unlikely(size == 0))
|
|
|
|
return;
|
|
|
|
|
2021-08-05 14:57:45 +02:00
|
|
|
again:
|
2019-11-14 19:02:54 +01:00
|
|
|
/*
|
|
|
|
* Avoid user_access_save in fast-path: find_watchpoint is safe without
|
|
|
|
* user_access_save, as the address that ptr points to is only used to
|
|
|
|
* check if a watchpoint exists; ptr is never dereferenced.
|
|
|
|
*/
|
2021-08-05 14:57:45 +02:00
|
|
|
watchpoint = find_watchpoint((unsigned long)ptr, size,
|
|
|
|
!(type & KCSAN_ACCESS_WRITE),
|
2019-11-14 19:02:54 +01:00
|
|
|
&encoded_watchpoint);
|
|
|
|
/*
|
|
|
|
* It is safe to check kcsan_is_enabled() after find_watchpoint in the
|
kcsan: Introduce KCSAN_ACCESS_ASSERT access type
The KCSAN_ACCESS_ASSERT access type may be used to introduce dummy reads
and writes to assert certain properties of concurrent code, where bugs
could not be detected as normal data races.
For example, a variable that is only meant to be written by a single
CPU, but may be read (without locking) by other CPUs must still be
marked properly to avoid data races. However, concurrent writes,
regardless if WRITE_ONCE() or not, would be a bug. Using
kcsan_check_access(&x, sizeof(x), KCSAN_ACCESS_ASSERT) would allow
catching such bugs.
To support KCSAN_ACCESS_ASSERT the following notable changes were made:
* If an access is of type KCSAN_ASSERT_ACCESS, disable various filters
that only apply to data races, so that all races that KCSAN observes are
reported.
* Bug reports that involve an ASSERT access type will be reported as
"KCSAN: assert: race in ..." instead of "data-race"; this will help
more easily distinguish them.
* Update a few comments to just mention 'races' where we do not always
mean pure data races.
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2020-02-06 16:46:24 +01:00
|
|
|
* slow-path, as long as no state changes that cause a race to be
|
2019-11-14 19:02:54 +01:00
|
|
|
* detected and reported have occurred until kcsan_is_enabled() is
|
|
|
|
* checked.
|
|
|
|
*/
|
|
|
|
|
|
|
|
if (unlikely(watchpoint != NULL))
|
2021-08-09 13:25:12 +02:00
|
|
|
kcsan_found_watchpoint(ptr, size, type, ip, watchpoint, encoded_watchpoint);
|
kcsan: Add support for scoped accesses
This adds support for scoped accesses, where the memory range is checked
for the duration of the scope. The feature is implemented by inserting
the relevant access information into a list of scoped accesses for
the current execution context, which are then checked (until removed)
on every call (through instrumentation) into the KCSAN runtime.
An alternative, more complex, implementation could set up a watchpoint for
the scoped access, and keep the watchpoint set up. This, however, would
require first exposing a handle to the watchpoint, as well as dealing
with cases such as accesses by the same thread while the watchpoint is
still set up (and several more cases). It is also doubtful if this would
provide any benefit, since the majority of delay where the watchpoint
is set up is likely due to the injected delays by KCSAN. Therefore,
the implementation in this patch is simpler and avoids hurting KCSAN's
main use-case (normal data race detection); it also implicitly increases
scoped-access race-detection-ability due to increased probability of
setting up watchpoints by repeatedly calling __kcsan_check_access()
throughout the scope of the access.
The implementation required adding an additional conditional branch to
the fast-path. However, the microbenchmark showed a *speedup* of ~5%
on the fast-path. This appears to be due to subtly improved codegen by
GCC from moving get_ctx() and associated load of preempt_count earlier.
Suggested-by: Boqun Feng <boqun.feng@gmail.com>
Suggested-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-25 17:41:56 +01:00
|
|
|
else {
|
|
|
|
struct kcsan_ctx *ctx = get_ctx(); /* Call only once in fast-path. */
|
|
|
|
|
2021-08-05 14:57:45 +02:00
|
|
|
if (unlikely(should_watch(ctx, ptr, size, type))) {
|
2021-08-09 13:25:12 +02:00
|
|
|
kcsan_setup_watchpoint(ptr, size, type, ip);
|
2021-08-05 14:57:45 +02:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!(type & KCSAN_ACCESS_SCOPED)) {
|
|
|
|
struct kcsan_scoped_access *reorder_access = get_reorder_access(ctx);
|
|
|
|
|
|
|
|
if (reorder_access) {
|
|
|
|
/*
|
|
|
|
* reorder_access check: simulates reordering of
|
|
|
|
* the access after subsequent operations.
|
|
|
|
*/
|
|
|
|
ptr = reorder_access->ptr;
|
|
|
|
type = reorder_access->type;
|
|
|
|
ip = reorder_access->ip;
|
|
|
|
/*
|
|
|
|
* Upon a nested interrupt, this context's
|
|
|
|
* reorder_access can be modified (shared ctx).
|
|
|
|
* We know that upon return, reorder_access is
|
|
|
|
* always invalidated by setting size to 0 via
|
|
|
|
* __tsan_func_exit(). Therefore we must read
|
|
|
|
* and check size after the other fields.
|
|
|
|
*/
|
|
|
|
barrier();
|
|
|
|
size = READ_ONCE(reorder_access->size);
|
|
|
|
if (size)
|
|
|
|
goto again;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Always checked last, right before returning from runtime;
|
|
|
|
* if reorder_access is valid, checked after it was checked.
|
|
|
|
*/
|
|
|
|
if (unlikely(ctx->scoped_accesses.prev))
|
kcsan: Add support for scoped accesses
This adds support for scoped accesses, where the memory range is checked
for the duration of the scope. The feature is implemented by inserting
the relevant access information into a list of scoped accesses for
the current execution context, which are then checked (until removed)
on every call (through instrumentation) into the KCSAN runtime.
An alternative, more complex, implementation could set up a watchpoint for
the scoped access, and keep the watchpoint set up. This, however, would
require first exposing a handle to the watchpoint, as well as dealing
with cases such as accesses by the same thread while the watchpoint is
still set up (and several more cases). It is also doubtful if this would
provide any benefit, since the majority of delay where the watchpoint
is set up is likely due to the injected delays by KCSAN. Therefore,
the implementation in this patch is simpler and avoids hurting KCSAN's
main use-case (normal data race detection); it also implicitly increases
scoped-access race-detection-ability due to increased probability of
setting up watchpoints by repeatedly calling __kcsan_check_access()
throughout the scope of the access.
The implementation required adding an additional conditional branch to
the fast-path. However, the microbenchmark showed a *speedup* of ~5%
on the fast-path. This appears to be due to subtly improved codegen by
GCC from moving get_ctx() and associated load of preempt_count earlier.
Suggested-by: Boqun Feng <boqun.feng@gmail.com>
Suggested-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-25 17:41:56 +01:00
|
|
|
kcsan_check_scoped_accesses();
|
|
|
|
}
|
2019-11-14 19:02:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
/* === Public interface ===================================================== */
|
|
|
|
|
|
|
|
/*
 * Initialize the KCSAN runtime: seed the random state of every possible CPU,
 * enable KCSAN if early enabling was requested, and log whether a strict or
 * non-strict configuration is in use. Must run in task context.
 */
void __init kcsan_init(void)
{
	const bool non_strict = IS_ENABLED(CONFIG_KCSAN_REPORT_VALUE_CHANGE_ONLY) ||
				IS_ENABLED(CONFIG_KCSAN_ASSUME_PLAIN_WRITES_ATOMIC) ||
				IS_ENABLED(CONFIG_KCSAN_PERMISSIVE) ||
				IS_ENABLED(CONFIG_KCSAN_IGNORE_ATOMICS);
	int cpu;

	BUG_ON(!in_task());

	for_each_possible_cpu(cpu) {
		per_cpu(kcsan_rand_state, cpu) = (u32)get_cycles();
	}

	if (kcsan_early_enable) {
		pr_info("enabled early\n");
		/*
		 * This is the init task and no other tasks should be running
		 * yet, so WRITE_ONCE without a memory barrier suffices.
		 */
		WRITE_ONCE(kcsan_enabled, true);
	}

	if (non_strict)
		pr_warn("non-strict mode configured - use CONFIG_KCSAN_STRICT=y to see all data races\n");
	else
		pr_info("strict mode configured\n");
}
|
|
|
|
|
|
|
|
/* === Exported interface =================================================== */
|
|
|
|
|
|
|
|
void kcsan_disable_current(void)
|
|
|
|
{
|
|
|
|
++get_ctx()->disable_count;
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kcsan_disable_current);
|
|
|
|
|
|
|
|
void kcsan_enable_current(void)
|
|
|
|
{
|
|
|
|
if (get_ctx()->disable_count-- == 0) {
|
|
|
|
/*
|
|
|
|
* Warn if kcsan_enable_current() calls are unbalanced with
|
|
|
|
* kcsan_disable_current() calls, which causes disable_count to
|
|
|
|
* become negative and should not happen.
|
|
|
|
*/
|
|
|
|
kcsan_disable_current(); /* restore to 0, KCSAN still enabled */
|
|
|
|
kcsan_disable_current(); /* disable to generate warning */
|
|
|
|
WARN(1, "Unbalanced %s()", __func__);
|
|
|
|
kcsan_enable_current();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kcsan_enable_current);
|
|
|
|
|
2020-04-24 17:47:29 +02:00
|
|
|
void kcsan_enable_current_nowarn(void)
|
|
|
|
{
|
|
|
|
if (get_ctx()->disable_count-- == 0)
|
|
|
|
kcsan_disable_current();
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kcsan_enable_current_nowarn);
|
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
void kcsan_nestable_atomic_begin(void)
|
|
|
|
{
|
|
|
|
/*
|
|
|
|
* Do *not* check and warn if we are in a flat atomic region: nestable
|
|
|
|
* and flat atomic regions are independent from each other.
|
|
|
|
* See include/linux/kcsan.h: struct kcsan_ctx comments for more
|
|
|
|
* comments.
|
|
|
|
*/
|
|
|
|
|
|
|
|
++get_ctx()->atomic_nest_count;
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kcsan_nestable_atomic_begin);
|
|
|
|
|
|
|
|
void kcsan_nestable_atomic_end(void)
|
|
|
|
{
|
|
|
|
if (get_ctx()->atomic_nest_count-- == 0) {
|
|
|
|
/*
|
|
|
|
* Warn if kcsan_nestable_atomic_end() calls are unbalanced with
|
|
|
|
* kcsan_nestable_atomic_begin() calls, which causes
|
|
|
|
* atomic_nest_count to become negative and should not happen.
|
|
|
|
*/
|
|
|
|
kcsan_nestable_atomic_begin(); /* restore to 0 */
|
|
|
|
kcsan_disable_current(); /* disable to generate warning */
|
|
|
|
WARN(1, "Unbalanced %s()", __func__);
|
|
|
|
kcsan_enable_current();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kcsan_nestable_atomic_end);
|
|
|
|
|
|
|
|
void kcsan_flat_atomic_begin(void)
|
|
|
|
{
|
|
|
|
get_ctx()->in_flat_atomic = true;
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kcsan_flat_atomic_begin);
|
|
|
|
|
|
|
|
void kcsan_flat_atomic_end(void)
|
|
|
|
{
|
|
|
|
get_ctx()->in_flat_atomic = false;
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kcsan_flat_atomic_end);
|
|
|
|
|
|
|
|
void kcsan_atomic_next(int n)
|
|
|
|
{
|
|
|
|
get_ctx()->atomic_next = n;
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kcsan_atomic_next);
|
|
|
|
|
2020-02-11 17:04:22 +01:00
|
|
|
void kcsan_set_access_mask(unsigned long mask)
|
|
|
|
{
|
|
|
|
get_ctx()->access_mask = mask;
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kcsan_set_access_mask);
|
|
|
|
|
kcsan: Add support for scoped accesses
This adds support for scoped accesses, where the memory range is checked
for the duration of the scope. The feature is implemented by inserting
the relevant access information into a list of scoped accesses for
the current execution context, which are then checked (until removed)
on every call (through instrumentation) into the KCSAN runtime.
An alternative, more complex, implementation could set up a watchpoint for
the scoped access, and keep the watchpoint set up. This, however, would
require first exposing a handle to the watchpoint, as well as dealing
with cases such as accesses by the same thread while the watchpoint is
still set up (and several more cases). It is also doubtful if this would
provide any benefit, since the majority of delay where the watchpoint
is set up is likely due to the injected delays by KCSAN. Therefore,
the implementation in this patch is simpler and avoids hurting KCSAN's
main use-case (normal data race detection); it also implicitly increases
scoped-access race-detection-ability due to increased probability of
setting up watchpoints by repeatedly calling __kcsan_check_access()
throughout the scope of the access.
The implementation required adding an additional conditional branch to
the fast-path. However, the microbenchmark showed a *speedup* of ~5%
on the fast-path. This appears to be due to subtly improved codegen by
GCC from moving get_ctx() and associated load of preempt_count earlier.
Suggested-by: Boqun Feng <boqun.feng@gmail.com>
Suggested-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-25 17:41:56 +01:00
|
|
|
struct kcsan_scoped_access *
|
|
|
|
kcsan_begin_scoped_access(const volatile void *ptr, size_t size, int type,
|
|
|
|
struct kcsan_scoped_access *sa)
|
|
|
|
{
|
|
|
|
struct kcsan_ctx *ctx = get_ctx();
|
|
|
|
|
2021-08-09 13:25:12 +02:00
|
|
|
check_access(ptr, size, type, _RET_IP_);
|
kcsan: Add support for scoped accesses
This adds support for scoped accesses, where the memory range is checked
for the duration of the scope. The feature is implemented by inserting
the relevant access information into a list of scoped accesses for
the current execution context, which are then checked (until removed)
on every call (through instrumentation) into the KCSAN runtime.
An alternative, more complex, implementation could set up a watchpoint for
the scoped access, and keep the watchpoint set up. This, however, would
require first exposing a handle to the watchpoint, as well as dealing
with cases such as accesses by the same thread while the watchpoint is
still set up (and several more cases). It is also doubtful if this would
provide any benefit, since the majority of delay where the watchpoint
is set up is likely due to the injected delays by KCSAN. Therefore,
the implementation in this patch is simpler and avoids hurting KCSAN's
main use-case (normal data race detection); it also implicitly increases
scoped-access race-detection-ability due to increased probability of
setting up watchpoints by repeatedly calling __kcsan_check_access()
throughout the scope of the access.
The implementation required adding an additional conditional branch to
the fast-path. However, the microbenchmark showed a *speedup* of ~5%
on the fast-path. This appears to be due to subtly improved codegen by
GCC from moving get_ctx() and associated load of preempt_count earlier.
Suggested-by: Boqun Feng <boqun.feng@gmail.com>
Suggested-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-25 17:41:56 +01:00
|
|
|
|
|
|
|
ctx->disable_count++; /* Disable KCSAN, in case list debugging is on. */
|
|
|
|
|
|
|
|
INIT_LIST_HEAD(&sa->list);
|
|
|
|
sa->ptr = ptr;
|
|
|
|
sa->size = size;
|
|
|
|
sa->type = type;
|
2021-08-09 13:25:13 +02:00
|
|
|
sa->ip = _RET_IP_;
|
kcsan: Add support for scoped accesses
This adds support for scoped accesses, where the memory range is checked
for the duration of the scope. The feature is implemented by inserting
the relevant access information into a list of scoped accesses for
the current execution context, which are then checked (until removed)
on every call (through instrumentation) into the KCSAN runtime.
An alternative, more complex, implementation could set up a watchpoint for
the scoped access, and keep the watchpoint set up. This, however, would
require first exposing a handle to the watchpoint, as well as dealing
with cases such as accesses by the same thread while the watchpoint is
still set up (and several more cases). It is also doubtful if this would
provide any benefit, since the majority of delay where the watchpoint
is set up is likely due to the injected delays by KCSAN. Therefore,
the implementation in this patch is simpler and avoids hurting KCSAN's
main use-case (normal data race detection); it also implicitly increases
scoped-access race-detection-ability due to increased probability of
setting up watchpoints by repeatedly calling __kcsan_check_access()
throughout the scope of the access.
The implementation required adding an additional conditional branch to
the fast-path. However, the microbenchmark showed a *speedup* of ~5%
on the fast-path. This appears to be due to subtly improved codegen by
GCC from moving get_ctx() and associated load of preempt_count earlier.
Suggested-by: Boqun Feng <boqun.feng@gmail.com>
Suggested-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-25 17:41:56 +01:00
|
|
|
|
|
|
|
if (!ctx->scoped_accesses.prev) /* Lazy initialize list head. */
|
|
|
|
INIT_LIST_HEAD(&ctx->scoped_accesses);
|
|
|
|
list_add(&sa->list, &ctx->scoped_accesses);
|
|
|
|
|
|
|
|
ctx->disable_count--;
|
|
|
|
return sa;
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kcsan_begin_scoped_access);
|
|
|
|
|
|
|
|
void kcsan_end_scoped_access(struct kcsan_scoped_access *sa)
|
|
|
|
{
|
|
|
|
struct kcsan_ctx *ctx = get_ctx();
|
|
|
|
|
|
|
|
if (WARN(!ctx->scoped_accesses.prev, "Unbalanced %s()?", __func__))
|
|
|
|
return;
|
|
|
|
|
|
|
|
ctx->disable_count++; /* Disable KCSAN, in case list debugging is on. */
|
|
|
|
|
|
|
|
list_del(&sa->list);
|
|
|
|
if (list_empty(&ctx->scoped_accesses))
|
|
|
|
/*
|
|
|
|
* Ensure we do not enter kcsan_check_scoped_accesses()
|
|
|
|
* slow-path if unnecessary, and avoids requiring list_empty()
|
|
|
|
* in the fast-path (to avoid a READ_ONCE() and potential
|
|
|
|
* uaccess warning).
|
|
|
|
*/
|
|
|
|
ctx->scoped_accesses.prev = NULL;
|
|
|
|
|
|
|
|
ctx->disable_count--;
|
|
|
|
|
2021-08-09 13:25:13 +02:00
|
|
|
check_access(sa->ptr, sa->size, sa->type, sa->ip);
|
kcsan: Add support for scoped accesses
This adds support for scoped accesses, where the memory range is checked
for the duration of the scope. The feature is implemented by inserting
the relevant access information into a list of scoped accesses for
the current execution context, which are then checked (until removed)
on every call (through instrumentation) into the KCSAN runtime.
An alternative, more complex, implementation could set up a watchpoint for
the scoped access, and keep the watchpoint set up. This, however, would
require first exposing a handle to the watchpoint, as well as dealing
with cases such as accesses by the same thread while the watchpoint is
still set up (and several more cases). It is also doubtful if this would
provide any benefit, since the majority of delay where the watchpoint
is set up is likely due to the injected delays by KCSAN. Therefore,
the implementation in this patch is simpler and avoids hurting KCSAN's
main use-case (normal data race detection); it also implicitly increases
scoped-access race-detection-ability due to increased probability of
setting up watchpoints by repeatedly calling __kcsan_check_access()
throughout the scope of the access.
The implementation required adding an additional conditional branch to
the fast-path. However, the microbenchmark showed a *speedup* of ~5%
on the fast-path. This appears to be due to subtly improved codegen by
GCC from moving get_ctx() and associated load of preempt_count earlier.
Suggested-by: Boqun Feng <boqun.feng@gmail.com>
Suggested-by: Paul E. McKenney <paulmck@kernel.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-03-25 17:41:56 +01:00
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kcsan_end_scoped_access);
|
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
void __kcsan_check_access(const volatile void *ptr, size_t size, int type)
|
|
|
|
{
|
2021-08-09 13:25:12 +02:00
|
|
|
check_access(ptr, size, type, _RET_IP_);
|
2019-11-14 19:02:54 +01:00
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(__kcsan_check_access);
|
|
|
|
|
2021-11-30 12:44:13 +01:00
|
|
|
#define DEFINE_MEMORY_BARRIER(name, order_before_cond) \
|
|
|
|
void __kcsan_##name(void) \
|
|
|
|
{ \
|
|
|
|
struct kcsan_scoped_access *sa = get_reorder_access(get_ctx()); \
|
|
|
|
if (!sa) \
|
|
|
|
return; \
|
|
|
|
if (order_before_cond) \
|
|
|
|
sa->size = 0; \
|
|
|
|
} \
|
|
|
|
EXPORT_SYMBOL(__kcsan_##name)
|
|
|
|
|
|
|
|
DEFINE_MEMORY_BARRIER(mb, true);
|
|
|
|
DEFINE_MEMORY_BARRIER(wmb, sa->type & (KCSAN_ACCESS_WRITE | KCSAN_ACCESS_COMPOUND));
|
|
|
|
DEFINE_MEMORY_BARRIER(rmb, !(sa->type & KCSAN_ACCESS_WRITE) || (sa->type & KCSAN_ACCESS_COMPOUND));
|
|
|
|
DEFINE_MEMORY_BARRIER(release, true);
|
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
/*
|
|
|
|
* KCSAN uses the same instrumentation that is emitted by supported compilers
|
|
|
|
* for ThreadSanitizer (TSAN).
|
|
|
|
*
|
|
|
|
* When enabled, the compiler emits instrumentation calls (the functions
|
|
|
|
* prefixed with "__tsan" below) for all loads and stores that it generated;
|
|
|
|
* inline asm is not instrumented.
|
|
|
|
*
|
|
|
|
* Note that, not all supported compiler versions distinguish aligned/unaligned
|
|
|
|
* accesses, but e.g. recent versions of Clang do. We simply alias the unaligned
|
|
|
|
* version to the generic version, which can handle both.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#define DEFINE_TSAN_READ_WRITE(size) \
|
2020-06-16 14:36:22 +02:00
|
|
|
void __tsan_read##size(void *ptr); \
|
2019-11-14 19:02:54 +01:00
|
|
|
void __tsan_read##size(void *ptr) \
|
|
|
|
{ \
|
2021-08-09 13:25:12 +02:00
|
|
|
check_access(ptr, size, 0, _RET_IP_); \
|
2019-11-14 19:02:54 +01:00
|
|
|
} \
|
|
|
|
EXPORT_SYMBOL(__tsan_read##size); \
|
|
|
|
void __tsan_unaligned_read##size(void *ptr) \
|
|
|
|
__alias(__tsan_read##size); \
|
|
|
|
EXPORT_SYMBOL(__tsan_unaligned_read##size); \
|
2020-06-16 14:36:22 +02:00
|
|
|
void __tsan_write##size(void *ptr); \
|
2019-11-14 19:02:54 +01:00
|
|
|
void __tsan_write##size(void *ptr) \
|
|
|
|
{ \
|
2021-08-09 13:25:12 +02:00
|
|
|
check_access(ptr, size, KCSAN_ACCESS_WRITE, _RET_IP_); \
|
2019-11-14 19:02:54 +01:00
|
|
|
} \
|
|
|
|
EXPORT_SYMBOL(__tsan_write##size); \
|
|
|
|
void __tsan_unaligned_write##size(void *ptr) \
|
|
|
|
__alias(__tsan_write##size); \
|
kcsan: Support compounded read-write instrumentation
Add support for compounded read-write instrumentation if supported by
the compiler. Adds the necessary instrumentation functions, and a new
type which is used to generate a more descriptive report.
Furthermore, such compounded memory access instrumentation is excluded
from the "assume aligned writes up to word size are atomic" rule,
because we cannot assume that the compiler emits code that is atomic for
compound ops.
LLVM/Clang added support for the feature in:
https://github.com/llvm/llvm-project/commit/785d41a261d136b64ab6c15c5d35f2adc5ad53e3
The new instrumentation is emitted for sets of memory accesses in the
same basic block to the same address with at least one read appearing
before a write. These typically result from compound operations such as
++, --, +=, -=, |=, &=, etc. but also equivalent forms such as "var =
var + 1". Where the compiler determines that it is equivalent to emit a
call to a single __tsan_read_write instead of separate __tsan_read and
__tsan_write, we can then benefit from improved performance and better
reporting for such access patterns.
The new reports now show that the ops are both reads and writes, for
example:
read-write to 0xffffffff90548a38 of 8 bytes by task 143 on cpu 3:
test_kernel_rmw_array+0x45/0xa0
access_thread+0x71/0xb0
kthread+0x21e/0x240
ret_from_fork+0x22/0x30
read-write to 0xffffffff90548a38 of 8 bytes by task 144 on cpu 2:
test_kernel_rmw_array+0x45/0xa0
access_thread+0x71/0xb0
kthread+0x21e/0x240
ret_from_fork+0x22/0x30
Acked-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-07-24 09:00:01 +02:00
|
|
|
EXPORT_SYMBOL(__tsan_unaligned_write##size); \
|
|
|
|
void __tsan_read_write##size(void *ptr); \
|
|
|
|
void __tsan_read_write##size(void *ptr) \
|
|
|
|
{ \
|
|
|
|
check_access(ptr, size, \
|
2021-08-09 13:25:12 +02:00
|
|
|
KCSAN_ACCESS_COMPOUND | KCSAN_ACCESS_WRITE, \
|
|
|
|
_RET_IP_); \
|
kcsan: Support compounded read-write instrumentation
Add support for compounded read-write instrumentation if supported by
the compiler. Adds the necessary instrumentation functions, and a new
type which is used to generate a more descriptive report.
Furthermore, such compounded memory access instrumentation is excluded
from the "assume aligned writes up to word size are atomic" rule,
because we cannot assume that the compiler emits code that is atomic for
compound ops.
LLVM/Clang added support for the feature in:
https://github.com/llvm/llvm-project/commit/785d41a261d136b64ab6c15c5d35f2adc5ad53e3
The new instrumentation is emitted for sets of memory accesses in the
same basic block to the same address with at least one read appearing
before a write. These typically result from compound operations such as
++, --, +=, -=, |=, &=, etc. but also equivalent forms such as "var =
var + 1". Where the compiler determines that it is equivalent to emit a
call to a single __tsan_read_write instead of separate __tsan_read and
__tsan_write, we can then benefit from improved performance and better
reporting for such access patterns.
The new reports now show that the ops are both reads and writes, for
example:
read-write to 0xffffffff90548a38 of 8 bytes by task 143 on cpu 3:
test_kernel_rmw_array+0x45/0xa0
access_thread+0x71/0xb0
kthread+0x21e/0x240
ret_from_fork+0x22/0x30
read-write to 0xffffffff90548a38 of 8 bytes by task 144 on cpu 2:
test_kernel_rmw_array+0x45/0xa0
access_thread+0x71/0xb0
kthread+0x21e/0x240
ret_from_fork+0x22/0x30
Acked-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Signed-off-by: Marco Elver <elver@google.com>
Signed-off-by: Paul E. McKenney <paulmck@kernel.org>
2020-07-24 09:00:01 +02:00
|
|
|
} \
|
|
|
|
EXPORT_SYMBOL(__tsan_read_write##size); \
|
|
|
|
void __tsan_unaligned_read_write##size(void *ptr) \
|
|
|
|
__alias(__tsan_read_write##size); \
|
|
|
|
EXPORT_SYMBOL(__tsan_unaligned_read_write##size)
|
2019-11-14 19:02:54 +01:00
|
|
|
|
|
|
|
DEFINE_TSAN_READ_WRITE(1);
|
|
|
|
DEFINE_TSAN_READ_WRITE(2);
|
|
|
|
DEFINE_TSAN_READ_WRITE(4);
|
|
|
|
DEFINE_TSAN_READ_WRITE(8);
|
|
|
|
DEFINE_TSAN_READ_WRITE(16);
|
|
|
|
|
2020-06-16 14:36:22 +02:00
|
|
|
void __tsan_read_range(void *ptr, size_t size);
|
2019-11-14 19:02:54 +01:00
|
|
|
void __tsan_read_range(void *ptr, size_t size)
|
|
|
|
{
|
2021-08-09 13:25:12 +02:00
|
|
|
check_access(ptr, size, 0, _RET_IP_);
|
2019-11-14 19:02:54 +01:00
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(__tsan_read_range);
|
|
|
|
|
2020-06-16 14:36:22 +02:00
|
|
|
void __tsan_write_range(void *ptr, size_t size);
|
2019-11-14 19:02:54 +01:00
|
|
|
void __tsan_write_range(void *ptr, size_t size)
|
|
|
|
{
|
2021-08-09 13:25:12 +02:00
|
|
|
check_access(ptr, size, KCSAN_ACCESS_WRITE, _RET_IP_);
|
2019-11-14 19:02:54 +01:00
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(__tsan_write_range);
|
|
|
|
|
2020-05-21 16:20:39 +02:00
|
|
|
/*
|
|
|
|
* Use of explicit volatile is generally disallowed [1], however, volatile is
|
|
|
|
* still used in various concurrent contexts, whether in low-level
|
|
|
|
* synchronization primitives or for legacy reasons.
|
|
|
|
* [1] https://lwn.net/Articles/233479/
|
|
|
|
*
|
|
|
|
* We only consider volatile accesses atomic if they are aligned and would pass
|
|
|
|
* the size-check of compiletime_assert_rwonce_type().
|
|
|
|
*/
|
|
|
|
#define DEFINE_TSAN_VOLATILE_READ_WRITE(size) \
|
2020-06-16 14:36:22 +02:00
|
|
|
void __tsan_volatile_read##size(void *ptr); \
|
2020-05-21 16:20:39 +02:00
|
|
|
void __tsan_volatile_read##size(void *ptr) \
|
|
|
|
{ \
|
|
|
|
const bool is_atomic = size <= sizeof(long long) && \
|
|
|
|
IS_ALIGNED((unsigned long)ptr, size); \
|
|
|
|
if (IS_ENABLED(CONFIG_KCSAN_IGNORE_ATOMICS) && is_atomic) \
|
|
|
|
return; \
|
2021-08-09 13:25:12 +02:00
|
|
|
check_access(ptr, size, is_atomic ? KCSAN_ACCESS_ATOMIC : 0, \
|
|
|
|
_RET_IP_); \
|
2020-05-21 16:20:39 +02:00
|
|
|
} \
|
|
|
|
EXPORT_SYMBOL(__tsan_volatile_read##size); \
|
|
|
|
void __tsan_unaligned_volatile_read##size(void *ptr) \
|
|
|
|
__alias(__tsan_volatile_read##size); \
|
|
|
|
EXPORT_SYMBOL(__tsan_unaligned_volatile_read##size); \
|
2020-06-16 14:36:22 +02:00
|
|
|
void __tsan_volatile_write##size(void *ptr); \
|
2020-05-21 16:20:39 +02:00
|
|
|
void __tsan_volatile_write##size(void *ptr) \
|
|
|
|
{ \
|
|
|
|
const bool is_atomic = size <= sizeof(long long) && \
|
|
|
|
IS_ALIGNED((unsigned long)ptr, size); \
|
|
|
|
if (IS_ENABLED(CONFIG_KCSAN_IGNORE_ATOMICS) && is_atomic) \
|
|
|
|
return; \
|
|
|
|
check_access(ptr, size, \
|
|
|
|
KCSAN_ACCESS_WRITE | \
|
2021-08-09 13:25:12 +02:00
|
|
|
(is_atomic ? KCSAN_ACCESS_ATOMIC : 0), \
|
|
|
|
_RET_IP_); \
|
2020-05-21 16:20:39 +02:00
|
|
|
} \
|
|
|
|
EXPORT_SYMBOL(__tsan_volatile_write##size); \
|
|
|
|
void __tsan_unaligned_volatile_write##size(void *ptr) \
|
|
|
|
__alias(__tsan_volatile_write##size); \
|
|
|
|
EXPORT_SYMBOL(__tsan_unaligned_volatile_write##size)
|
|
|
|
|
|
|
|
DEFINE_TSAN_VOLATILE_READ_WRITE(1);
|
|
|
|
DEFINE_TSAN_VOLATILE_READ_WRITE(2);
|
|
|
|
DEFINE_TSAN_VOLATILE_READ_WRITE(4);
|
|
|
|
DEFINE_TSAN_VOLATILE_READ_WRITE(8);
|
|
|
|
DEFINE_TSAN_VOLATILE_READ_WRITE(16);
|
|
|
|
|
2019-11-14 19:02:54 +01:00
|
|
|
/*
|
2021-08-05 14:57:45 +02:00
|
|
|
* Function entry and exit are used to determine the validity of reorder_access.
|
|
|
|
* Reordering of the access ends at the end of the function scope where the
|
|
|
|
* access happened. This is done for two reasons:
|
|
|
|
*
|
|
|
|
* 1. Artificially limits the scope where missing barriers are detected.
|
|
|
|
* This minimizes false positives due to uninstrumented functions that
|
|
|
|
* contain the required barriers but were missed.
|
|
|
|
*
|
|
|
|
* 2. Simplifies generating the stack trace of the access.
|
2019-11-14 19:02:54 +01:00
|
|
|
*/
|
2020-06-16 14:36:22 +02:00
|
|
|
void __tsan_func_entry(void *call_pc);
|
2021-08-05 14:57:45 +02:00
|
|
|
noinline void __tsan_func_entry(void *call_pc)
|
2019-11-14 19:02:54 +01:00
|
|
|
{
|
2021-08-05 14:57:45 +02:00
|
|
|
if (!IS_ENABLED(CONFIG_KCSAN_WEAK_MEMORY))
|
|
|
|
return;
|
|
|
|
|
|
|
|
add_kcsan_stack_depth(1);
|
2019-11-14 19:02:54 +01:00
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(__tsan_func_entry);
|
2021-08-05 14:57:45 +02:00
|
|
|
|
2020-06-16 14:36:22 +02:00
|
|
|
void __tsan_func_exit(void);
|
2021-08-05 14:57:45 +02:00
|
|
|
noinline void __tsan_func_exit(void)
|
2019-11-14 19:02:54 +01:00
|
|
|
{
|
2021-08-05 14:57:45 +02:00
|
|
|
struct kcsan_scoped_access *reorder_access;
|
|
|
|
|
|
|
|
if (!IS_ENABLED(CONFIG_KCSAN_WEAK_MEMORY))
|
|
|
|
return;
|
|
|
|
|
|
|
|
reorder_access = get_reorder_access(get_ctx());
|
|
|
|
if (!reorder_access)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
if (get_kcsan_stack_depth() <= reorder_access->stack_depth) {
|
|
|
|
/*
|
|
|
|
* Access check to catch cases where write without a barrier
|
|
|
|
* (supposed release) was last access in function: because
|
|
|
|
* instrumentation is inserted before the real access, a data
|
|
|
|
* race due to the write giving up a c-s would only be caught if
|
|
|
|
* we do the conflicting access after.
|
|
|
|
*/
|
|
|
|
check_access(reorder_access->ptr, reorder_access->size,
|
|
|
|
reorder_access->type, reorder_access->ip);
|
|
|
|
reorder_access->size = 0;
|
|
|
|
reorder_access->stack_depth = INT_MIN;
|
|
|
|
}
|
|
|
|
out:
|
|
|
|
add_kcsan_stack_depth(-1);
|
2019-11-14 19:02:54 +01:00
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(__tsan_func_exit);
|
2021-08-05 14:57:45 +02:00
|
|
|
|
2020-06-16 14:36:22 +02:00
|
|
|
void __tsan_init(void);
/* Exported __tsan_init() hook; intentionally has nothing to do. */
void __tsan_init(void)
{
	/* No-op. */
}
EXPORT_SYMBOL(__tsan_init);
|
2020-07-03 15:40:29 +02:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Instrumentation for atomic builtins (__atomic_*, __sync_*).
|
|
|
|
*
|
|
|
|
* Normal kernel code _should not_ be using them directly, but some
|
|
|
|
* architectures may implement some or all atomics using the compilers'
|
|
|
|
* builtins.
|
|
|
|
*
|
|
|
|
* Note: If an architecture decides to fully implement atomics using the
|
|
|
|
* builtins, because they are implicitly instrumented by KCSAN (and KASAN,
|
|
|
|
* etc.), implementing the ARCH_ATOMIC interface (to get instrumentation via
|
|
|
|
* atomic-instrumented) is no longer necessary.
|
|
|
|
*
|
|
|
|
* TSAN instrumentation replaces atomic accesses with calls to any of the below
|
|
|
|
* functions, whose job is to also execute the operation itself.
|
|
|
|
*/
|
|
|
|
|
2021-11-30 12:44:13 +01:00
|
|
|
/*
 * Invoke __kcsan_release() when @memorder is one of __ATOMIC_RELEASE,
 * __ATOMIC_ACQ_REL or __ATOMIC_SEQ_CST; any other value is ignored.
 */
static __always_inline void kcsan_atomic_builtin_memorder(int memorder)
{
	switch (memorder) {
	case __ATOMIC_RELEASE:
	case __ATOMIC_ACQ_REL:
	case __ATOMIC_SEQ_CST:
		__kcsan_release();
		break;
	default:
		break;
	}
}
|
|
|
|
|
2020-07-03 15:40:29 +02:00
|
|
|
/*
 * Generate and export __tsan_atomic<bits>_load() and
 * __tsan_atomic<bits>_store().
 *
 * Each hook first handles @memorder via kcsan_atomic_builtin_memorder(), then
 * (unless CONFIG_KCSAN_IGNORE_ATOMICS is enabled) checks the access as
 * atomic, and finally performs the real operation with the matching
 * __atomic_*_n() builtin.
 */
#define DEFINE_TSAN_ATOMIC_LOAD_STORE(bits)					\
	u##bits __tsan_atomic##bits##_load(const u##bits *ptr, int memorder);	\
	u##bits __tsan_atomic##bits##_load(const u##bits *ptr, int memorder)	\
	{									\
		kcsan_atomic_builtin_memorder(memorder);			\
		if (!IS_ENABLED(CONFIG_KCSAN_IGNORE_ATOMICS)) {			\
			const int type = KCSAN_ACCESS_ATOMIC;			\
										\
			check_access(ptr, bits / BITS_PER_BYTE, type,		\
				     _RET_IP_);					\
		}								\
		return __atomic_load_n(ptr, memorder);				\
	}									\
	EXPORT_SYMBOL(__tsan_atomic##bits##_load);				\
	void __tsan_atomic##bits##_store(u##bits *ptr, u##bits v, int memorder); \
	void __tsan_atomic##bits##_store(u##bits *ptr, u##bits v, int memorder) \
	{									\
		kcsan_atomic_builtin_memorder(memorder);			\
		if (!IS_ENABLED(CONFIG_KCSAN_IGNORE_ATOMICS)) {			\
			const int type = KCSAN_ACCESS_WRITE |			\
					 KCSAN_ACCESS_ATOMIC;			\
										\
			check_access(ptr, bits / BITS_PER_BYTE, type,		\
				     _RET_IP_);					\
		}								\
		__atomic_store_n(ptr, v, memorder);				\
	}									\
	EXPORT_SYMBOL(__tsan_atomic##bits##_store)
|
|
|
|
|
|
|
|
/*
 * Generate and export the read-modify-write hook __tsan_atomic<bits>_<op>().
 *
 * The hook handles @memorder, checks the access as an atomic compound write
 * (unless CONFIG_KCSAN_IGNORE_ATOMICS is enabled), and returns the result of
 * the builtin __atomic_<op><suffix>().
 */
#define DEFINE_TSAN_ATOMIC_RMW(op, bits, suffix)				\
	u##bits __tsan_atomic##bits##_##op(u##bits *ptr, u##bits v, int memorder); \
	u##bits __tsan_atomic##bits##_##op(u##bits *ptr, u##bits v, int memorder) \
	{									\
		kcsan_atomic_builtin_memorder(memorder);			\
		if (!IS_ENABLED(CONFIG_KCSAN_IGNORE_ATOMICS)) {			\
			const int type = KCSAN_ACCESS_COMPOUND |		\
					 KCSAN_ACCESS_WRITE |			\
					 KCSAN_ACCESS_ATOMIC;			\
										\
			check_access(ptr, bits / BITS_PER_BYTE, type,		\
				     _RET_IP_);					\
		}								\
		return __atomic_##op##suffix(ptr, v, memorder);			\
	}									\
	EXPORT_SYMBOL(__tsan_atomic##bits##_##op)
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Note: CAS operations are always classified as write, even in case they
|
|
|
|
* fail. We cannot perform check_access() after a write, as it might lead to
|
|
|
|
* false positives, in cases such as:
|
|
|
|
*
|
|
|
|
* T0: __atomic_compare_exchange_n(&p->flag, &old, 1, ...)
|
|
|
|
*
|
|
|
|
* T1: if (__atomic_load_n(&p->flag, ...)) {
|
|
|
|
* modify *p;
|
|
|
|
* p->flag = 0;
|
|
|
|
* }
|
|
|
|
*
|
|
|
|
* The only downside is that, if there are 3 threads, with one CAS that
|
|
|
|
* succeeds, another CAS that fails, and an unmarked racing operation, we may
|
|
|
|
* point at the wrong CAS as the source of the race. However, if we assume that
|
|
|
|
* all CAS can succeed in some other execution, the data race is still valid.
|
|
|
|
*/
|
|
|
|
/*
 * Generate and export __tsan_atomic<bits>_compare_exchange_<strength>().
 *
 * The access is checked before the operation and always as an atomic compound
 * write, whether or not the exchange ends up succeeding. @weak is passed
 * through as the "weak" argument of __atomic_compare_exchange_n(), whose
 * result is returned.
 */
#define DEFINE_TSAN_ATOMIC_CMPXCHG(bits, strength, weak)			\
	int __tsan_atomic##bits##_compare_exchange_##strength(u##bits *ptr, u##bits *exp, \
							      u##bits val, int mo, int fail_mo); \
	int __tsan_atomic##bits##_compare_exchange_##strength(u##bits *ptr, u##bits *exp, \
							      u##bits val, int mo, int fail_mo) \
	{									\
		kcsan_atomic_builtin_memorder(mo);				\
		if (!IS_ENABLED(CONFIG_KCSAN_IGNORE_ATOMICS)) {			\
			const int type = KCSAN_ACCESS_COMPOUND |		\
					 KCSAN_ACCESS_WRITE |			\
					 KCSAN_ACCESS_ATOMIC;			\
										\
			check_access(ptr, bits / BITS_PER_BYTE, type,		\
				     _RET_IP_);					\
		}								\
		return __atomic_compare_exchange_n(ptr, exp, val, weak, mo, fail_mo); \
	}									\
	EXPORT_SYMBOL(__tsan_atomic##bits##_compare_exchange_##strength)
|
|
|
|
|
|
|
|
/*
 * Generate and export __tsan_atomic<bits>_compare_exchange_val().
 *
 * Same checking as the other compare-exchange hooks, but @exp is taken by
 * value. A strong __atomic_compare_exchange_n() is run against the local copy
 * of @exp, and that copy is returned afterwards.
 */
#define DEFINE_TSAN_ATOMIC_CMPXCHG_VAL(bits)					\
	u##bits __tsan_atomic##bits##_compare_exchange_val(u##bits *ptr, u##bits exp, u##bits val, \
							   int mo, int fail_mo); \
	u##bits __tsan_atomic##bits##_compare_exchange_val(u##bits *ptr, u##bits exp, u##bits val, \
							   int mo, int fail_mo) \
	{									\
		kcsan_atomic_builtin_memorder(mo);				\
		if (!IS_ENABLED(CONFIG_KCSAN_IGNORE_ATOMICS)) {			\
			const int type = KCSAN_ACCESS_COMPOUND |		\
					 KCSAN_ACCESS_WRITE |			\
					 KCSAN_ACCESS_ATOMIC;			\
										\
			check_access(ptr, bits / BITS_PER_BYTE, type,		\
				     _RET_IP_);					\
		}								\
		__atomic_compare_exchange_n(ptr, &exp, val, 0, mo, fail_mo);	\
		return exp;							\
	}									\
	EXPORT_SYMBOL(__tsan_atomic##bits##_compare_exchange_val)
|
|
|
|
|
|
|
|
#define DEFINE_TSAN_ATOMIC_OPS(bits) \
|
|
|
|
DEFINE_TSAN_ATOMIC_LOAD_STORE(bits); \
|
|
|
|
DEFINE_TSAN_ATOMIC_RMW(exchange, bits, _n); \
|
|
|
|
DEFINE_TSAN_ATOMIC_RMW(fetch_add, bits, ); \
|
|
|
|
DEFINE_TSAN_ATOMIC_RMW(fetch_sub, bits, ); \
|
|
|
|
DEFINE_TSAN_ATOMIC_RMW(fetch_and, bits, ); \
|
|
|
|
DEFINE_TSAN_ATOMIC_RMW(fetch_or, bits, ); \
|
|
|
|
DEFINE_TSAN_ATOMIC_RMW(fetch_xor, bits, ); \
|
|
|
|
DEFINE_TSAN_ATOMIC_RMW(fetch_nand, bits, ); \
|
|
|
|
DEFINE_TSAN_ATOMIC_CMPXCHG(bits, strong, 0); \
|
|
|
|
DEFINE_TSAN_ATOMIC_CMPXCHG(bits, weak, 1); \
|
|
|
|
DEFINE_TSAN_ATOMIC_CMPXCHG_VAL(bits)
|
|
|
|
|
|
|
|
DEFINE_TSAN_ATOMIC_OPS(8);
|
|
|
|
DEFINE_TSAN_ATOMIC_OPS(16);
|
|
|
|
DEFINE_TSAN_ATOMIC_OPS(32);
|
|
|
|
DEFINE_TSAN_ATOMIC_OPS(64);
|
|
|
|
|
|
|
|
void __tsan_atomic_thread_fence(int memorder);
/*
 * Thread-fence hook: handle @memorder via kcsan_atomic_builtin_memorder(),
 * then issue the real fence with __atomic_thread_fence().
 */
void __tsan_atomic_thread_fence(int memorder)
{
	kcsan_atomic_builtin_memorder(memorder);

	__atomic_thread_fence(memorder);
}
EXPORT_SYMBOL(__tsan_atomic_thread_fence);
|
|
|
|
|
2021-11-30 12:44:13 +01:00
|
|
|
/*
|
|
|
|
* In instrumented files, we emit instrumentation for barriers by mapping the
|
|
|
|
* kernel barriers to an __atomic_signal_fence(), which is interpreted specially
|
|
|
|
* and otherwise has no relation to a real __atomic_signal_fence(). No known
|
|
|
|
* kernel code uses __atomic_signal_fence().
|
|
|
|
*
|
|
|
|
* Since fsanitize=thread instrumentation handles __atomic_signal_fence(), which
|
|
|
|
* are turned into calls to __tsan_atomic_signal_fence(), such instrumentation
|
|
|
|
* can be disabled via the __no_kcsan function attribute (vs. an explicit call
|
|
|
|
* which could not). When __no_kcsan is requested, __atomic_signal_fence()
|
|
|
|
* generates no code.
|
|
|
|
*
|
|
|
|
* Note: The result of using __atomic_signal_fence() with KCSAN enabled is
|
|
|
|
* potentially limiting the compiler's ability to reorder operations; however,
|
|
|
|
* if barriers were instrumented with explicit calls (without LTO), the compiler
|
|
|
|
* couldn't optimize much anyway. The result of a hypothetical architecture
|
|
|
|
* using __atomic_signal_fence() in normal code would be KCSAN false negatives.
|
|
|
|
*/
|
2020-07-03 15:40:29 +02:00
|
|
|
void __tsan_atomic_signal_fence(int memorder);
|
2021-11-30 12:44:13 +01:00
|
|
|
noinline void __tsan_atomic_signal_fence(int memorder)
|
|
|
|
{
|
|
|
|
switch (memorder) {
|
|
|
|
case __KCSAN_BARRIER_TO_SIGNAL_FENCE_mb:
|
|
|
|
__kcsan_mb();
|
|
|
|
break;
|
|
|
|
case __KCSAN_BARRIER_TO_SIGNAL_FENCE_wmb:
|
|
|
|
__kcsan_wmb();
|
|
|
|
break;
|
|
|
|
case __KCSAN_BARRIER_TO_SIGNAL_FENCE_rmb:
|
|
|
|
__kcsan_rmb();
|
|
|
|
break;
|
|
|
|
case __KCSAN_BARRIER_TO_SIGNAL_FENCE_release:
|
|
|
|
__kcsan_release();
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2020-07-03 15:40:29 +02:00
|
|
|
EXPORT_SYMBOL(__tsan_atomic_signal_fence);
|