debug: Introduce a portion of UBSan

Without UBSan:
```
 text    data     bss     dec     hex filename
  85612     208  142258  228078   37aee nuttx
```

with UBSan:
```
   text    data     bss     dec     hex filename
 194290   98164  208634  501088   7a560 nuttx
```

```c
/* Sample program used to demonstrate a UBSan report. */
int main(int argc, FAR char *argv[])
{
  uint32_t ptr[32];
  /* Index 64 is past the end of the 32-element array; this is the access
   * reported as array-index-out-of-bounds in the output shown below.
   */
  printf("Hello, World!! %lu\n", ptr[64]);
  return 0;
}
```
Try to run this sample:
```
nsh> hello
ubsan_prologue: ================================================================================
ubsan_prologue: UBSAN: array-index-out-of-bounds in hello_main.c:39:37
__ubsan_handle_out_of_bounds: index 64 is out of range for type 'uint32_t [32]'
ubsan_epilogue: ================================================================================
Hello, World!! 1070182368
nsh>
```

Signed-off-by: Huang Qi <huangqi3@xiaomi.com>
This commit is contained in:
Huang Qi 2022-08-19 08:09:59 +00:00 committed by Xiang Xiao
parent 49c50d3bf4
commit a06ec54cd0
16 changed files with 646 additions and 0 deletions

View file

@ -83,6 +83,14 @@ ifeq ($(CONFIG_MM_KASAN),y)
ARCHOPTIMIZATION += -fsanitize=kernel-address
endif
# Build every file with -fsanitize=undefined when CONFIG_MM_UBSAN_ALL is set.
ifeq ($(CONFIG_MM_UBSAN_ALL),y)
ARCHOPTIMIZATION += -fsanitize=undefined
endif
# Add the trap-on-error flag when CONFIG_MM_UBSAN_TRAP_ON_ERROR is set.
ifeq ($(CONFIG_MM_UBSAN_TRAP_ON_ERROR),y)
ARCHOPTIMIZATION += -fsanitize-undefined-trap-on-error
endif
# NuttX buildroot under Linux or Cygwin
ifeq ($(CONFIG_ARM_TOOLCHAIN),BUILDROOT)

View file

@ -169,6 +169,14 @@ ifeq ($(CONFIG_MM_KASAN),y)
ARCHOPTIMIZATION += -fsanitize=kernel-address
endif
# Build every file with -fsanitize=undefined when CONFIG_MM_UBSAN_ALL is set.
ifeq ($(CONFIG_MM_UBSAN_ALL),y)
ARCHOPTIMIZATION += -fsanitize=undefined
endif
# Add the trap-on-error flag when CONFIG_MM_UBSAN_TRAP_ON_ERROR is set.
ifeq ($(CONFIG_MM_UBSAN_TRAP_ON_ERROR),y)
ARCHOPTIMIZATION += -fsanitize-undefined-trap-on-error
endif
ARCHCFLAGS += -fno-common
ARCHCXXFLAGS += -fno-common -nostdinc++

View file

@ -124,6 +124,14 @@ ifeq ($(CONFIG_ARCH_COVERAGE),y)
ARCHOPTIMIZATION += -fprofile-generate -ftest-coverage
endif
# Build every file with -fsanitize=undefined when CONFIG_MM_UBSAN_ALL is set.
ifeq ($(CONFIG_MM_UBSAN_ALL),y)
ARCHOPTIMIZATION += -fsanitize=undefined
endif
# Add the trap-on-error flag when CONFIG_MM_UBSAN_TRAP_ON_ERROR is set.
ifeq ($(CONFIG_MM_UBSAN_TRAP_ON_ERROR),y)
ARCHOPTIMIZATION += -fsanitize-undefined-trap-on-error
endif
ifeq ($(CONFIG_ENDIAN_BIG),y)
TARGET_ARCH := armeb
else

View file

@ -89,6 +89,14 @@ ifeq ($(CONFIG_ARMV7M_STACKCHECK),y)
ARCHOPTIMIZATION += -finstrument-functions -ffixed-r10
endif
# Build every file with -fsanitize=undefined when CONFIG_MM_UBSAN_ALL is set.
ifeq ($(CONFIG_MM_UBSAN_ALL),y)
ARCHOPTIMIZATION += -fsanitize=undefined
endif
# Add the trap-on-error flag when CONFIG_MM_UBSAN_TRAP_ON_ERROR is set.
ifeq ($(CONFIG_MM_UBSAN_TRAP_ON_ERROR),y)
ARCHOPTIMIZATION += -fsanitize-undefined-trap-on-error
endif
# Parametrization for ARCHCPUFLAGS
ifeq ($(CONFIG_ARCH_CORTEXM4),y)

View file

@ -100,6 +100,14 @@ ifeq ($(CONFIG_MM_KASAN),y)
ARCHOPTIMIZATION += -fsanitize=kernel-address
endif
# Build every file with -fsanitize=undefined when CONFIG_MM_UBSAN_ALL is set.
ifeq ($(CONFIG_MM_UBSAN_ALL),y)
ARCHOPTIMIZATION += -fsanitize=undefined
endif
# Add the trap-on-error flag when CONFIG_MM_UBSAN_TRAP_ON_ERROR is set.
ifeq ($(CONFIG_MM_UBSAN_TRAP_ON_ERROR),y)
ARCHOPTIMIZATION += -fsanitize-undefined-trap-on-error
endif
ifeq ($(CONFIG_ENDIAN_BIG),y)
TARGET_ARCH := armeb
else

View file

@ -89,6 +89,14 @@ ifeq ($(CONFIG_ARMV8M_STACKCHECK),y)
ARCHOPTIMIZATION += -finstrument-functions -ffixed-r10
endif
# Build every file with -fsanitize=undefined when CONFIG_MM_UBSAN_ALL is set.
ifeq ($(CONFIG_MM_UBSAN_ALL),y)
ARCHOPTIMIZATION += -fsanitize=undefined
endif
# Add the trap-on-error flag when CONFIG_MM_UBSAN_TRAP_ON_ERROR is set.
ifeq ($(CONFIG_MM_UBSAN_TRAP_ON_ERROR),y)
ARCHOPTIMIZATION += -fsanitize-undefined-trap-on-error
endif
# Parametrization for ARCHCPUFLAGS
ifeq ($(CONFIG_ARCH_CORTEXM23),y)

View file

@ -62,6 +62,14 @@ ifeq ($(CONFIG_ARCH_COVERAGE),y)
ARCHOPTIMIZATION += -fprofile-generate -ftest-coverage
endif
# Build every file with -fsanitize=undefined when CONFIG_MM_UBSAN_ALL is set.
ifeq ($(CONFIG_MM_UBSAN_ALL),y)
ARCHOPTIMIZATION += -fsanitize=undefined
endif
# Add the trap-on-error flag when CONFIG_MM_UBSAN_TRAP_ON_ERROR is set.
ifeq ($(CONFIG_MM_UBSAN_TRAP_ON_ERROR),y)
ARCHOPTIMIZATION += -fsanitize-undefined-trap-on-error
endif
ARCHCFLAGS += -fno-common
ARCHCXXFLAGS += -fno-common -nostdinc++

View file

@ -166,6 +166,14 @@ ifeq ($(CONFIG_MM_KASAN),y)
ARCHOPTIMIZATION += -fsanitize=kernel-address
endif
# Build every file with -fsanitize=undefined when CONFIG_MM_UBSAN_ALL is set.
ifeq ($(CONFIG_MM_UBSAN_ALL),y)
ARCHOPTIMIZATION += -fsanitize=undefined
endif
# Add the trap-on-error flag when CONFIG_MM_UBSAN_TRAP_ON_ERROR is set.
ifeq ($(CONFIG_MM_UBSAN_TRAP_ON_ERROR),y)
ARCHOPTIMIZATION += -fsanitize-undefined-trap-on-error
endif
# Default toolchain
CC = $(CROSSDEV)gcc

View file

@ -47,6 +47,14 @@ ifeq ($(CONFIG_MM_KASAN),y)
ARCHOPTIMIZATION += -fsanitize=kernel-address
endif
# Build every file with -fsanitize=undefined when CONFIG_MM_UBSAN_ALL is set.
ifeq ($(CONFIG_MM_UBSAN_ALL),y)
ARCHOPTIMIZATION += -fsanitize=undefined
endif
# Add the trap-on-error flag when CONFIG_MM_UBSAN_TRAP_ON_ERROR is set.
ifeq ($(CONFIG_MM_UBSAN_TRAP_ON_ERROR),y)
ARCHOPTIMIZATION += -fsanitize-undefined-trap-on-error
endif
ifeq ($(CONFIG_DEBUG_CUSTOMOPT),y)
ARCHOPTIMIZATION += $(CONFIG_DEBUG_OPTLEVEL)
else ifeq ($(CONFIG_DEBUG_FULLOPT),y)

View file

@ -47,6 +47,14 @@ ifeq ($(CONFIG_MM_KASAN),y)
ARCHOPTIMIZATION += -fsanitize=kernel-address
endif
# Build every file with -fsanitize=undefined when CONFIG_MM_UBSAN_ALL is set.
ifeq ($(CONFIG_MM_UBSAN_ALL),y)
ARCHOPTIMIZATION += -fsanitize=undefined
endif
# Add the trap-on-error flag when CONFIG_MM_UBSAN_TRAP_ON_ERROR is set.
ifeq ($(CONFIG_MM_UBSAN_TRAP_ON_ERROR),y)
ARCHOPTIMIZATION += -fsanitize-undefined-trap-on-error
endif
ifeq ($(CONFIG_DEBUG_CUSTOMOPT),y)
ARCHOPTIMIZATION += $(CONFIG_DEBUG_OPTLEVEL)
else ifeq ($(CONFIG_DEBUG_FULLOPT),y)

View file

@ -79,6 +79,12 @@ endif
# Add -fsanitize=undefined when either the simulator-specific option
# (CONFIG_SIM_UBSAN) or the whole-image option (CONFIG_MM_UBSAN_ALL) is set;
# the else branch keeps the flag from being added twice.
ifeq ($(CONFIG_SIM_UBSAN),y)
ARCHOPTIMIZATION += -fsanitize=undefined
else ifeq ($(CONFIG_MM_UBSAN_ALL),y)
ARCHOPTIMIZATION += -fsanitize=undefined
endif
# Add the trap-on-error flag when CONFIG_MM_UBSAN_TRAP_ON_ERROR is set.
ifeq ($(CONFIG_MM_UBSAN_TRAP_ON_ERROR),y)
ARCHOPTIMIZATION += -fsanitize-undefined-trap-on-error
endif
# Add -fno-common because macOS "ld -r" doesn't seem to pick objects

View file

@ -191,6 +191,34 @@ config MM_KASAN
bugs in native code. After turn on this option, Please
add -fsanitize=kernel-address to CFLAGS/CXXFLAGS too.
config MM_UBSAN
bool "Undefined Behavior Sanitizer"
default n
---help---
UBSan is a fast undefined behavior detector. UBSan modifies
the program at compile-time to catch various kinds of
undefined behavior during program execution.
config MM_UBSAN_ALL
bool "Enable UBSan for the entire image"
depends on MM_UBSAN
default y
---help---
This option activates UBSan instrumentation for the
entire image. If you don't enable this option, you have to
explicitly specify "-fsanitize=undefined" for
the files/directories you want to check. Enabling this option
significantly increases the image size and decreases
performance.
config MM_UBSAN_TRAP_ON_ERROR
bool "Enable UBsan trap on error to crash immediately"
depends on MM_UBSAN
default y
---help---
Trap with an undefined instruction when undefined behavior is
detected, so that the program crashes immediately. This also
saves a significant amount of code space.
config MM_FILL_ALLOCATIONS
bool "Fill allocations with debug value"
default n

View file

@ -31,6 +31,7 @@ include iob/Make.defs
include circbuf/Make.defs
include mempool/Make.defs
include kasan/Make.defs
include ubsan/Make.defs
BINDIR ?= bin

28
mm/ubsan/Make.defs Normal file
View file

@ -0,0 +1,28 @@
############################################################################
# mm/ubsan/Make.defs
#
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership. The
# ASF licenses this file to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance with the
# License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations
# under the License.
#
############################################################################
# Compile ubsan.c and add the ubsan directory to the dependency and source
# search paths only when CONFIG_MM_UBSAN is enabled.
ifeq ($(CONFIG_MM_UBSAN),y)
CSRCS += ubsan.c
DEPPATH += --dep-path ubsan
VPATH += :ubsan
endif

377
mm/ubsan/ubsan.c Normal file
View file

@ -0,0 +1,377 @@
/****************************************************************************
* mm/ubsan/ubsan.c
*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership. The
* ASF licenses this file to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance with the
* License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and limitations
* under the License.
*
****************************************************************************/
/****************************************************************************
* Included Files
****************************************************************************/
#include <nuttx/compiler.h>
#include <debug.h>
#include <stdio.h>
#include "ubsan.h"
/****************************************************************************
* Pre-processor Definitions
****************************************************************************/
/* Non-zero when none of the bits selected by the mask (a - 1) are set in x.
 * This equals "x is a multiple of a" only when a is a power of two.
 */
#define IS_ALIGNED(x, a) (((x) & ((a) - 1)) == 0)
/****************************************************************************
* Private Data
****************************************************************************/
/* Text describing the kind of access that failed a type check.  The table
 * is indexed with the type_check_kind field of the mismatch data by the
 * handle_*() helpers in this file.
 * NOTE(review): those helpers index the table without a range check, so a
 * type_check_kind of 8 or more would read past the end - confirm the
 * compiler in use never emits one.
 */
static FAR const char *const g_type_check_kinds[] =
{
"load of",
"store to",
"reference binding to",
"member access within",
"member call on",
"constructor call on",
"downcast of",
"downcast of"
};
/****************************************************************************
* Private Functions
****************************************************************************/
/* Open a UBSan report: print the separator line, then the kind of undefined
 * behavior (reason) together with the file:line:column stored in loc.
 */

static void ubsan_prologue(FAR struct source_location *loc,
                           FAR const char *reason)
{
  FAR const char *file;
  uint32_t line;
  uint32_t column;

  _alert("========================================"
         "========================================\n");

  file   = loc->file_name;
  line   = loc->line;
  column = loc->column;

  _alert("UBSAN: %s in %s:%" PRIu32 ":%" PRIu32"\n",
         reason, file, line, column);
}
/* Close a UBSan report by printing the same separator line that
 * ubsan_prologue() prints first.
 */
static void ubsan_epilogue(void)
{
_alert("========================================"
"========================================\n");
}
/* Print a complete report that has no detail lines: the prologue for
 * loc/reason immediately followed by the epilogue.
 */
static void ubsan_prologue_epilogue(FAR struct source_location *loc,
FAR const char *reason)
{
ubsan_prologue(loc, reason);
ubsan_epilogue();
}
/* Report an access through a null pointer, naming the kind of access and
 * the type that was expected at that address.
 */

static void handle_null_ptr_deref(FAR struct type_mismatch_data_common *data)
{
  FAR const char *access = g_type_check_kinds[data->type_check_kind];
  FAR const char *type_name = data->type->type_name;

  ubsan_prologue(data->location, "null-pointer-dereference");
  _alert("%s null pointer of type %s\n", access, type_name);
  ubsan_epilogue();
}
/* Report an access through a pointer that does not satisfy the alignment
 * recorded in data.
 *
 *   data - common description of the failed type check
 *   ptr  - the misaligned address
 */

static void handle_misaligned_access(
  FAR struct type_mismatch_data_common *data, uintptr_t ptr)
{
  ubsan_prologue(data->location, "misaligned-access");
  _alert("%s misaligned address %p for type %s\n",
         g_type_check_kinds[data->type_check_kind], (FAR void *)ptr,
         data->type->type_name);

  /* alignment is an unsigned long, so it must be printed with %lu */

  _alert("which requires %lu byte alignment\n", data->alignment);
  ubsan_epilogue();
}
/* Report an access to an address that does not have enough room for an
 * object of the expected type.
 */

static void handle_object_size_mismatch(
  FAR struct type_mismatch_data_common *data, uintptr_t ptr)
{
  FAR const char *access = g_type_check_kinds[data->type_check_kind];
  FAR void *addr = (FAR void *)ptr;

  ubsan_prologue(data->location, "object-size-mismatch");
  _alert("%s address %p with insufficient space\n", access, addr);
  _alert("for an object of type %s\n", data->type->type_name);
  ubsan_epilogue();
}
/* Classify a failed type check and print the matching report.  A null ptr
 * is reported first, then a ptr that violates a non-zero alignment; any
 * other case is reported as an object size mismatch.
 */

static void ubsan_type_mismatch_common(
  FAR struct type_mismatch_data_common *data, uintptr_t ptr)
{
  if (ptr == 0)
    {
      handle_null_ptr_deref(data);
      return;
    }

  if (data->alignment != 0 && !IS_ALIGNED(ptr, data->alignment))
    {
      handle_misaligned_access(data, ptr);
      return;
    }

  handle_object_size_mismatch(data, ptr);
}
/* True when the descriptor's type_kind is TYPE_KIND_INT. */

static bool type_is_int(FAR struct type_descriptor *type)
{
  uint16_t kind = type->type_kind;

  return kind == TYPE_KIND_INT;
}
/* True when bit 0 of the descriptor's type_info is set. */

static bool type_is_signed(FAR struct type_descriptor *type)
{
  return (type->type_info & 1) != 0;
}
/* Width of the type in bits: type_info with bit 0 shifted out is used as
 * the exponent of a power of two.
 */

static unsigned type_bit_width(FAR struct type_descriptor *type)
{
  int log2_width = type->type_info >> 1;

  return 1 << log2_width;
}
/* True when a value of this type is no wider than a uintptr_t.  The value
 * accessors in this file then take the value from the handler argument
 * itself rather than reading it through the argument as a pointer.
 */

static bool is_inline_int(FAR struct type_descriptor *type)
{
  unsigned pointer_bits = sizeof(uintptr_t) * 8;

  return type_bit_width(type) <= pointer_bits;
}
/* Return the value carried by a handler argument as a signed 64-bit number.
 *
 *   type - descriptor of the value's type
 *   val  - the handler argument; holds the value itself when the type fits
 *          in a uintptr_t, otherwise it is dereferenced as an int64_t
 *
 * Inline values are sign-extended from the width of the type to 64 bits.
 */

static int64_t get_signed_val(FAR struct type_descriptor *type,
                              FAR void *val)
{
  if (is_inline_int(type))
    {
      unsigned extra_bits = sizeof(int64_t) * 8 - type_bit_width(type);
      uint64_t raw = (uintptr_t)val;

      /* Move the sign bit of the narrow type up to bit 63 in the unsigned
       * domain, where the left shift cannot overflow, and only then shift
       * back down as a signed value to replicate the sign bit.
       */

      return (int64_t)(raw << extra_bits) >> extra_bits;
    }

  return *(FAR int64_t *)val;
}
/* True when the type is signed and the value it carries is below zero. */

static bool val_is_negative(FAR struct type_descriptor *type, FAR void *val)
{
  if (!type_is_signed(type))
    {
      return false;
    }

  return get_signed_val(type, val) < 0;
}
/* Return the value carried by a handler argument as an unsigned 64-bit
 * number: val is dereferenced when the type is wider than a uintptr_t,
 * otherwise val itself is the value.
 */

static uint64_t get_unsigned_val(FAR struct type_descriptor *type,
                                 FAR void *val)
{
  if (!is_inline_int(type))
    {
      return *(uint64_t *)val;
    }

  return (uintptr_t)val;
}
/* Format the value carried by a handler argument as decimal text.
 *
 *   str   - destination buffer
 *   size  - size of the destination buffer in bytes
 *   type  - descriptor of the value's type
 *   value - the handler argument carrying the value
 *
 * Integer types are printed as signed or unsigned decimals.  For any other
 * kind of type a placeholder is stored, because every caller prints str
 * with %s and must never see an uninitialized buffer.
 */

static void val_to_string(FAR char *str, size_t size,
                          FAR struct type_descriptor *type,
                          FAR void *value)
{
  if (!type_is_int(type))
    {
      snprintf(str, size, "<unknown>");
      return;
    }

  if (type_is_signed(type))
    {
      snprintf(str, size, "%" PRId64, get_signed_val(type, value));
    }
  else
    {
      snprintf(str, size, "%" PRIu64, get_unsigned_val(type, value));
    }
}
/****************************************************************************
* Public Functions
****************************************************************************/
/* Handler for an array index that is out of range.
 *
 *   data  - struct out_of_bounds_data describing the access
 *   index - the offending index value
 */

void __ubsan_handle_out_of_bounds(FAR void *data, FAR void *index)
{
  FAR struct out_of_bounds_data *oob = data;
  char text[40];

  /* Formatting produces no output, so it can be done before the report */

  val_to_string(text, sizeof(text), oob->index_type, index);

  ubsan_prologue(&oob->location, "array-index-out-of-bounds");
  _alert("index %s is out of range for type %s\n",
         text, oob->array_type->type_name);
  ubsan_epilogue();
}
/* Handler for an invalid shift.
 *
 *   data - struct shift_out_of_bounds_data describing the operation
 *   lhs  - the value being shifted
 *   rhs  - the shift count
 *
 * The detail line distinguishes, in this order: a negative count, a count
 * not smaller than the width of the shifted type, a negative shifted value,
 * and finally a result that does not fit the type.
 */

void __ubsan_handle_shift_out_of_bounds(FAR void *data,
                                        FAR void *lhs, FAR void *rhs)
{
  FAR struct shift_out_of_bounds_data *shift = data;
  FAR struct type_descriptor *value_type = shift->lhs_type;
  FAR struct type_descriptor *count_type = shift->rhs_type;
  unsigned value_bits = type_bit_width(value_type);
  char value_str[40];
  char count_str[40];

  val_to_string(count_str, sizeof(count_str), count_type, rhs);
  val_to_string(value_str, sizeof(value_str), value_type, lhs);

  ubsan_prologue(&shift->location, "shift-out-of-bounds");

  if (val_is_negative(count_type, rhs))
    {
      _alert("shift exponent %s is negative\n", count_str);
    }
  else if (get_unsigned_val(count_type, rhs) >= value_bits)
    {
      _alert("shift exponent %s is too large for %u-bit type %s\n",
             count_str, value_bits, value_type->type_name);
    }
  else if (val_is_negative(value_type, lhs))
    {
      _alert("left shift of negative value %s\n", value_str);
    }
  else
    {
      _alert("left shift of %s by %s places cannot be"
             " represented in type %s\n",
             value_str, count_str, value_type->type_name);
    }

  ubsan_epilogue();
}
/* Handler for a division or remainder that cannot be computed.
 *
 *   data - struct overflow_data describing the operation
 *   lhs  - the dividend
 *   rhs  - the divisor
 *
 * A signed divisor of -1 is reported as an unrepresentable result, naming
 * the dividend; every other case is reported as a division by zero.
 */

void __ubsan_handle_divrem_overflow(FAR void *data,
                                    FAR void *lhs, FAR void *rhs)
{
  FAR struct overflow_data *info = data;
  char lhs_val_str[40];

  ubsan_prologue(&info->location, "division-overflow");

  if (type_is_signed(info->type) && get_signed_val(info->type, rhs) == -1)
    {
      /* The message reads "division of <dividend> by -1", so it is the
       * left-hand operand that has to be printed here.
       */

      val_to_string(lhs_val_str, sizeof(lhs_val_str), info->type, lhs);
      _alert("division of %s by -1 cannot be represented in type %s\n",
             lhs_val_str, info->type->type_name);
    }
  else
    {
      _alert("division by zero\n");
    }

  /* Close the report like every other handler does */

  ubsan_epilogue();
}
/* Handler for a pointer that violates an alignment assumption.
 *
 *   data   - struct alignment_assumption_data describing the assumption
 *   ptr    - the pointer that was checked
 *   align  - the alignment, in bytes, that was assumed
 *   offset - offset that was assumed between ptr and the aligned address
 *
 * The report states the assumption and then the alignment that the address
 * (ptr - offset) really has, together with its misalignment in bytes.
 */

void __ubsan_handle_alignment_assumption(FAR void *data, uintptr_t ptr,
                                         uintptr_t align, uintptr_t offset)
{
  FAR struct alignment_assumption_data *info = data;
  uintptr_t real_ptr = ptr - offset;
  unsigned long actual_align;

  ubsan_prologue(&info->location, "alignment-assumption");

  /* uintptr_t has no portable plain conversion specifier, so the values
   * are converted to unsigned long and printed with %lu.
   */

  if (offset)
    {
      _alert("assumption of %lu byte alignment (with offset of %lu byte) "
             "for pointer of type %s failed\n",
             (unsigned long)align, (unsigned long)offset,
             info->type->type_name);
    }
  else
    {
      _alert("assumption of %lu byte alignment for pointer of type %s "
             "failed\n",
             (unsigned long)align, info->type->type_name);
    }

  /* ffsl() numbers bits starting from 1, so the lowest set bit of real_ptr
   * is bit (ffsl() - 1) and the address is aligned to 1 << (ffsl() - 1).
   */

  actual_align = 1ul << (real_ptr ? ffsl(real_ptr) - 1 : 0);

  _alert("%saddress is %lu aligned, misalignment offset is %lu bytes\n",
         offset ? "offset " : "",
         actual_align,
         (unsigned long)(real_ptr & (align - 1)));
  ubsan_epilogue();
}
/* Handler for a failed type check whose data stores the required alignment
 * directly in bytes.  The data is repacked into the common layout and
 * handed to ubsan_type_mismatch_common() together with the address.
 */

void __ubsan_handle_type_mismatch(FAR struct type_mismatch_data *data,
                                  FAR void *ptr)
{
  struct type_mismatch_data_common common;

  common.location        = &data->location;
  common.type            = data->type;
  common.alignment       = data->alignment;
  common.type_check_kind = data->type_check_kind;

  ubsan_type_mismatch_common(&common, (uintptr_t)ptr);
}
/* Handler for a failed type check whose data stores the required alignment
 * as a power-of-two exponent.  The exponent is expanded to a byte count
 * while the data is repacked into the common layout.
 */

void __ubsan_handle_type_mismatch_v1(FAR void *_data, FAR void *ptr)
{
  FAR struct type_mismatch_data_v1 *mismatch = _data;
  struct type_mismatch_data_common common;

  common.location        = &mismatch->location;
  common.type            = mismatch->type;
  common.alignment       = 1ul << mismatch->log_alignment;
  common.type_check_kind = mismatch->type_check_kind;

  ubsan_type_mismatch_common(&common, (uintptr_t)ptr);
}
/* Handler for reaching code marked unreachable: print the report for the
 * source location passed in data, then PANIC().
 */

void __ubsan_handle_builtin_unreachable(FAR void *data)
{
  FAR struct source_location *loc = data;

  ubsan_prologue_epilogue(loc, "unreachable");
  PANIC();
}
/* Handler for a nonnull-arg violation: print a report for the source
 * location passed in data.
 */

void __ubsan_handle_nonnull_arg(FAR void *data)
{
  FAR struct source_location *loc = data;

  ubsan_prologue_epilogue(loc, "nonnull-arg");
}
/* Handler for an overflowing addition: print a report for the source
 * location passed in data.  The operand values are not reported.
 */

void __ubsan_handle_add_overflow(FAR void *data,
                                 FAR void *lhs, FAR void *rhs)
{
  FAR struct source_location *loc = data;

  (void)lhs;
  (void)rhs;

  ubsan_prologue_epilogue(loc, "add-overflow");
}
/* Handler for an overflowing subtraction: print a report for the source
 * location passed in data.  The operand values are not reported.
 */

void __ubsan_handle_sub_overflow(FAR void *data,
                                 FAR void *lhs, FAR void *rhs)
{
  FAR struct source_location *loc = data;

  (void)lhs;
  (void)rhs;

  ubsan_prologue_epilogue(loc, "sub-overflow");
}
/* Handler for an overflowing multiplication: print a report for the source
 * location passed in data.  The operand values are not reported.
 */

void __ubsan_handle_mul_overflow(FAR void *data,
                                 FAR void *lhs, FAR void *rhs)
{
  FAR struct source_location *loc = data;

  (void)lhs;
  (void)rhs;

  ubsan_prologue_epilogue(loc, "mul-overflow");
}
/* Handler for a load of an invalid value: print a report for the source
 * location passed in data.  The second argument is not reported.
 */

void __ubsan_handle_load_invalid_value(FAR void *data, FAR void *ptr)
{
  FAR struct source_location *loc = data;

  (void)ptr;

  ubsan_prologue_epilogue(loc, "load-invalid-value");
}
/* Handler for an overflowing negation: print a report for the source
 * location passed in data.  The second argument is not reported.
 */

void __ubsan_handle_negate_overflow(FAR void *data, FAR void *ptr)
{
  FAR struct source_location *loc = data;

  (void)ptr;

  ubsan_prologue_epilogue(loc, "negate-overflow");
}
/* Handler for overflowing pointer arithmetic: print a report for the source
 * location passed in data.  The pointer values are not reported.
 */

void __ubsan_handle_pointer_overflow(FAR void *data,
                                     FAR void *ptr, FAR void *result)
{
  FAR struct source_location *loc = data;

  (void)ptr;
  (void)result;

  ubsan_prologue_epilogue(loc, "pointer-overflow");
}

126
mm/ubsan/ubsan.h Normal file
View file

@ -0,0 +1,126 @@
/****************************************************************************
* mm/ubsan/ubsan.h
*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership. The
* ASF licenses this file to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance with the
* License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and limitations
* under the License.
*
****************************************************************************/
#ifndef __MM_UBSAN_UBSAN_H
#define __MM_UBSAN_UBSAN_H
/****************************************************************************
* Included Files
****************************************************************************/
#include <stdint.h>
/****************************************************************************
* Public Types
****************************************************************************/
/* Values of the type_kind field of struct type_descriptor. */

enum type_kind_e
{
  TYPE_KIND_INT     = 0x0000,
  TYPE_KIND_FLOAT   = 0x0001,
  TYPE_KIND_UNKNOWN = 0xffff
};
/* Description of a type that appears in a report.
 *
 * type_kind is compared against enum type_kind_e.  ubsan.c reads bit 0 of
 * type_info as the "signed" flag and uses the remaining bits as the
 * power-of-two exponent of the width in bits.  type_name is printed with %s.
 * NOTE(review): type_name is declared with a single element but is printed
 * as a NUL-terminated string, so it presumably acts as a variable-length
 * trailing member - confirm.
 */
struct type_descriptor
{
uint16_t type_kind;
uint16_t type_info;
char type_name[1];
};
/* Source position of a report; ubsan.c prints it as file_name:line:column.
 *
 * NOTE(review): reported shares storage with line/column through the union
 * and is not referenced by ubsan.c - its intended use should be confirmed.
 */
struct source_location
{
FAR const char *file_name;
union
{
unsigned long reported;
struct
{
uint32_t line;
uint32_t column;
};
};
};
/* Data for arithmetic reports: where the operation is and the type it was
 * performed in.  __ubsan_handle_divrem_overflow() in ubsan.c reads both
 * fields.
 */
struct overflow_data
{
struct source_location location;
FAR struct type_descriptor *type;
};
/* Data received by __ubsan_handle_type_mismatch().  alignment is copied
 * unchanged into the common layout, where it is treated as a byte count;
 * type_check_kind selects the access description.
 */
struct type_mismatch_data
{
struct source_location location;
FAR struct type_descriptor *type;
unsigned long alignment;
unsigned char type_check_kind;
};
/* Data received by __ubsan_handle_type_mismatch_v1().  It differs from
 * struct type_mismatch_data in that the alignment is stored as an exponent:
 * the handler computes the byte alignment as 1 << log_alignment.
 */
struct type_mismatch_data_v1
{
struct source_location location;
FAR struct type_descriptor *type;
unsigned char log_alignment;
unsigned char type_check_kind;
};
/* Internal layout that both type mismatch handlers convert their data to
 * before calling the shared reporting code.  Unlike the two structs above,
 * location is a pointer to the source location and alignment is always a
 * byte count.
 */
struct type_mismatch_data_common
{
FAR struct source_location *location;
FAR struct type_descriptor *type;
unsigned long alignment;
unsigned char type_check_kind;
};
/* Data for a nonnull-arg report.
 * NOTE(review): ubsan.c does not reference this struct by name;
 * __ubsan_handle_nonnull_arg() only uses its argument as a source location.
 * The fields presumably give the call site, the location of the attribute
 * and the index of the offending argument - confirm.
 */
struct nonnull_arg_data
{
struct source_location location;
struct source_location attr_location;
int arg_index;
};
/* Data received by __ubsan_handle_out_of_bounds(): where the access is,
 * the type of the array (its name is printed) and the type of the index
 * (used to format the index value).
 */
struct out_of_bounds_data
{
struct source_location location;
FAR struct type_descriptor *array_type;
FAR struct type_descriptor *index_type;
};
/* Data received by __ubsan_handle_shift_out_of_bounds(): where the shift
 * is, the type of the shifted value (lhs) and the type of the shift count
 * (rhs).
 */
struct shift_out_of_bounds_data
{
struct source_location location;
FAR struct type_descriptor *lhs_type;
FAR struct type_descriptor *rhs_type;
};
/* Data for a load-invalid-value report.
 * NOTE(review): ubsan.c does not reference this struct by name;
 * __ubsan_handle_load_invalid_value() only uses its argument as a source
 * location, so the type field is currently not reported.
 */
struct invalid_value_data
{
struct source_location location;
FAR struct type_descriptor *type;
};
/* Data received by __ubsan_handle_alignment_assumption(), which reads
 * location and the name of type.
 * NOTE(review): assumption_location is not read by ubsan.c; it presumably
 * records where the alignment assumption was declared - confirm.
 */
struct alignment_assumption_data
{
struct source_location location;
struct source_location assumption_location;
FAR struct type_descriptor *type;
};
#endif /* __MM_UBSAN_UBSAN_H */