Re: CFI violation in drivers/infiniband/core/sysfs.c

From: Nathan Chancellor
Date: Sat Apr 03 2021 - 02:56:08 EST


On Fri, Apr 02, 2021 at 04:03:30PM -0700, Kees Cook wrote:
> On Fri, Apr 02, 2021 at 12:52:41PM -0700, Nathan Chancellor wrote:
> > Hi all,
> >
> > I am testing the Clang Control Flow Integrity series that is being
> > worked on right now [1] and I encounter a violation in the Infiniband
> > sysfs core (drivers/infiniband/core/sysfs.c) on an arm64 server with mlx5:
> >
> > $ cat /sys/class/infiniband/mlx5_bond_0/ports/1/hw_counters/lifespan
> > 12
> >
> > $ echo "10" | sudo tee /sys/class/infiniband/mlx5_bond_0/ports/1/hw_counters/lifespan
> > 10
> >
> > $ sudo dmesg
> > [64198.670342] ------------[ cut here ]------------
> > [64198.670362] CFI failure (target: show_stats_lifespan+0x0/0x8 [ib_core]):
> > [64198.671291] WARNING: CPU: 20 PID: 15786 at kernel/cfi.c:29 __ubsan_handle_cfi_check_fail+0x58/0x60
> > [64198.671336] Modules linked in: binfmt_misc nls_iso8859_1 dm_multipath
> > scsi_dh_rdac scsi_dh_emc scsi_dh_alua ast drm_vram_helper drm_ttm_helper
> > ttm aes_ce_blk crypto_simd drm_kms_helper cryptd cec rc_core
> > aes_ce_cipher crct10dif_ce sysimgblt ghash_ce syscopyarea sysfillrect
> > acpi_ipmi sha2_ce fb_sys_fops ipmi_ssif sha256_arm64 ipmi_devintf
> > sha1_ce drm efi_pstore sbsa_gwdt tcp_westwood evbug ipmi_msghandler
> > cppc_cpufreq xgene_hwmon ib_iser rdma_cm iw_cm ib_cm iscsi_tcp
> > libiscsi_tcp libiscsi scsi_transport_iscsi bonding ip_tables x_tables
> > autofs4 raid10 raid456 libcrc32c async_raid6_recov async_pq raid6_pq
> > async_xor xor xor_neon async_memcpy async_tx raid1 raid0 multipath
> > linear mlx5_ib ib_uverbs ib_core mlx5_core mlxfw igb i2c_algo_bit tls
> > i2c_xgene_slimpro ahci_platform gpio_dwapb
> > [64198.671958] CPU: 20 PID: 15786 Comm: cat Tainted: G W 5.12.0-rc5+ #5
> > [64198.671980] Hardware name: Lenovo HR330A 7X33CTO1WW /HR350A , BIOS HVE104D-1.02 03/08/2019
> > [64198.671993] pstate: 60400005 (nZCv daif +PAN -UAO -TCO BTYPE=--)
> > [64198.672016] pc : __ubsan_handle_cfi_check_fail+0x58/0x60
> > [64198.672036] lr : __ubsan_handle_cfi_check_fail+0x58/0x60
> > [64198.672054] sp : ffff800014ea3b50
> > [64198.672065] x29: ffff800014ea3b50 x28: ffff80001122da60
> > [64198.672095] x27: ffff80001122ad80 x26: ffff800011233088
> > [64198.672122] x25: ffff000801821a78 x24: ffff000820cda200
> > [64198.672148] x23: ffff800009aa9f60 x22: ffff800009a66000
> > [64198.672173] x21: 7dac81f92e1d85cf x20: ffff800009abddd0
> > [64198.672198] x19: ffff800009a69fd8 x18: ffffffffffffffff
> > [64198.672223] x17: 0000000000000000 x16: 0000000000000000
> > [64198.672250] x15: 0000000000000004 x14: 0000000000001fff
> > [64198.672277] x13: ffff8000121412a8 x12: 0000000000000003
> > [64198.672303] x11: 0000000000000000 x10: 0000000000000027
> > [64198.672329] x9 : 4568e3af67e9f000 x8 : 4568e3af67e9f000
> > [64198.672356] x7 : 6e6170736566696c x6 : ffff8000124699c9
> > [64198.672381] x5 : 0000000000000000 x4 : 0000000000000001
> > [64198.672406] x3 : 0000000000000000 x2 : 0000000000000000
> > [64198.672431] x1 : ffff8000119b905d x0 : 000000000000003c
> > [64198.672457] Call trace:
> > [64198.672469] __ubsan_handle_cfi_check_fail+0x58/0x60
> > [64198.672489] __cfi_check_fail+0x3c/0x44 [ib_core]
> > [64198.673362] __cfi_check+0x2e78/0x31b0 [ib_core]
> > [64198.674230] port_attr_show+0x88/0x98 [ib_core]
> > [64198.675098] sysfs_kf_seq_show+0xc4/0x160
> > [64198.675131] kernfs_seq_show+0x5c/0xa4
> > [64198.675157] seq_read_iter+0x178/0x60c
> > [64198.675176] kernfs_fop_read_iter+0x78/0x1fc
> > [64198.675202] vfs_read+0x2d0/0x34c
> > [64198.675220] ksys_read+0x80/0xec
> > [64198.675237] __arm64_sys_read+0x28/0x34
> > [64198.675253] el0_svc_common.llvm.13467398108545334879+0xbc/0x1f0
> > [64198.675277] do_el0_svc+0x30/0xa4
> > [64198.675293] el0_svc+0x30/0xb0
> > [64198.675314] el0_sync_handler+0x84/0xe4
> > [64198.675333] el0_sync+0x174/0x180
> > [64198.675351] ---[ end trace a253e31759778f5c ]---
> > [64216.024673] ------------[ cut here ]------------
> > [64216.024678] CFI failure (target: set_stats_lifespan+0x0/0x8 [ib_core]):
> > [64216.024824] WARNING: CPU: 3 PID: 15816 at kernel/cfi.c:29 __ubsan_handle_cfi_check_fail+0x58/0x60
> > [64216.024832] Modules linked in: binfmt_misc nls_iso8859_1 dm_multipath
> > scsi_dh_rdac scsi_dh_emc scsi_dh_alua ast drm_vram_helper drm_ttm_helper
> > ttm aes_ce_blk crypto_simd drm_kms_helper cryptd cec rc_core
> > aes_ce_cipher crct10dif_ce sysimgblt ghash_ce syscopyarea sysfillrect
> > acpi_ipmi sha2_ce fb_sys_fops ipmi_ssif sha256_arm64 ipmi_devintf
> > sha1_ce drm efi_pstore sbsa_gwdt tcp_westwood evbug ipmi_msghandler
> > cppc_cpufreq xgene_hwmon ib_iser rdma_cm iw_cm ib_cm iscsi_tcp
> > libiscsi_tcp libiscsi scsi_transport_iscsi bonding ip_tables x_tables
> > autofs4 raid10 raid456 libcrc32c async_raid6_recov async_pq raid6_pq
> > async_xor xor xor_neon async_memcpy async_tx raid1 raid0 multipath
> > linear mlx5_ib ib_uverbs ib_core mlx5_core mlxfw igb i2c_algo_bit tls
> > i2c_xgene_slimpro ahci_platform gpio_dwapb
> > [64216.024922] CPU: 3 PID: 15816 Comm: tee Tainted: G W 5.12.0-rc5+ #5
> > [64216.024925] Hardware name: Lenovo HR330A 7X33CTO1WW /HR350A , BIOS HVE104D-1.02 03/08/2019
> > [64216.024927] pstate: 60400005 (nZCv daif +PAN -UAO -TCO BTYPE=--)
> > [64216.024931] pc : __ubsan_handle_cfi_check_fail+0x58/0x60
> > [64216.024933] lr : __ubsan_handle_cfi_check_fail+0x58/0x60
> > [64216.024936] sp : ffff800015433bf0
> > [64216.024938] x29: ffff800015433bf0 x28: ffff000808a00000
> > [64216.024942] x27: 0000000000000000 x26: 0000000000000000
> > [64216.024945] x25: ffff0008062e5000 x24: ffff000808a00000
> > [64216.024949] x23: ffff000825ba9600 x22: ffff800009a66000
> > [64216.024952] x21: 6d3b10b5d517da5b x20: ffff800009abddf0
> > [64216.024956] x19: ffff800009a69fb8 x18: ffffffffffffffff
> > [64216.024959] x17: 0000000000000000 x16: 0000000000000000
> > [64216.024962] x15: 0000000000000004 x14: 0000000000001fff
> > [64216.024966] x13: ffff8000121412a8 x12: 0000000000000003
> > [64216.024969] x11: 0000000000000000 x10: 0000000000000027
> > [64216.024973] x9 : 4568e3af67e9f000 x8 : 4568e3af67e9f000
> > [64216.024976] x7 : 2b6e617073656669 x6 : ffff8000124699c8
> > [64216.024979] x5 : 0000000000000000 x4 : 0000000000000001
> > [64216.024983] x3 : 0000000000000000 x2 : 0000000000000000
> > [64216.024986] x1 : ffff8000119b905d x0 : 000000000000003b
> > [64216.024990] Call trace:
> > [64216.024992] __ubsan_handle_cfi_check_fail+0x58/0x60
> > [64216.024995] __cfi_check_fail+0x3c/0x44 [ib_core]
> > [64216.025133] __cfi_check+0x2e78/0x31b0 [ib_core]
> > [64216.025277] port_attr_store+0x5c/0x90 [ib_core]
> > [64216.025422] sysfs_kf_write+0x70/0xd0
> > [64216.025428] kernfs_fop_write_iter+0x110/0x1dc
> > [64216.025431] vfs_write+0x364/0x46c
> > [64216.025435] ksys_write+0x80/0xec
> > [64216.025437] __arm64_sys_write+0x28/0x34
> > [64216.025439] el0_svc_common.llvm.13467398108545334879+0xbc/0x1f0
> > [64216.025443] do_el0_svc+0x30/0xa4
> > [64216.025445] el0_svc+0x30/0xb0
> > [64216.025450] el0_sync_handler+0x84/0xe4
> > [64216.025452] el0_sync+0x174/0x180
> > [64216.025455] ---[ end trace a253e31759778f5d ]---
> >
> > According to the call trace, sysfs_kf_seq_show() calls port_attr_show()
> > because that is the show() member of port_sysfs_ops and port_attr_show()
> > calls show_stats_lifespan() via an indirect call (port_attr->show()).
> > The show() member of 'struct port_attribute' is:
> >
> > ssize_t (*show)(struct ib_port *, struct port_attribute *, char *buf);
> >
> > but show_stats_lifespan() is defined to be the show() member of
> > 'struct hw_stats_attribute', which is of type
> >
> > ssize_t (*show)(struct kobject *kobj, struct attribute *attr, char *buf);
> >
> > so there is a mismatch and the CFI code warns about it. The store
> > functions have the same issue as you can see above.
> >
> > I have been trying to work my way through the code in order to suggest a
> > solution and I am getting lost hence my report. I think the issue is
> > that the hw_counters folder in sysfs is a 'struct attribute_group',
> > which gets added underneath the 'struct ib_ports' kobj in add_port(),
> > meaning that it inherits the sysfs ops from the 'struct ib_ports' kobj,
> > which are port_attr_{show,store}(). Initially, I though that
> > 'struct hw_stats_attribute' could just be converted over to
> > 'struct port_attribute' but it seems 'struct hw_stats_attribute' does
> > not have to be used underneath 'struct ib_port', it can be underneath
> > 'struct ib_device', where 'struct port_attribute' is not going to be
> > relevant. It seems to me that the hw_counters 'struct attribute_group'
> > should probably be its own kobj within both of these structures so they
> > can have their own sysfs ops (unless there is some other way to do this
> > that I am missing).
>
> Owwww. Yeah, I agree with your evaluation.
>
> > I would appreciate someone else taking a look and seeing if I am off
> > base or if there is an easier way to solve this.
>
> So, it seems that the reason for a custom kobj_type here is to use the
> .release callback. That can't be done without also specifying the ops,
> but the "default" sysfs ops aren't exported. Most sysfs users aren't
> allocating their attributes (they're static .data). (Though if this
> becomes a common pattern, perhaps we should export the default sysfs ops
> for users to override the .release callback without needing to specify a
> show wrapper.)
>
> So, I think, the solution is below. This hasn't been runtime tested. It
> basically removes the ib_port callback prototype and leaves everything
> as kobject/attr. The callbacks then do their own container_of() calls.

Well that appear to be okay from a runtime perspective.

$ cat /sys/class/infiniband/mlx5_bond_0/ports/1/hw_counters/lifespan
12

and there is no stacktrace (from that function at least, I found a
couple more violations that I will send patches for). If you decide to
formally send it, you can stick a

Tested-by: Nathan Chancellor <nathan@xxxxxxxxxx>

on it.

Cheers!

> diff --git a/drivers/infiniband/core/sysfs.c b/drivers/infiniband/core/sysfs.c
> index b8abb30f80df..2c68bb8c6e08 100644
> --- a/drivers/infiniband/core/sysfs.c
> +++ b/drivers/infiniband/core/sysfs.c
> @@ -67,14 +67,11 @@ struct ib_port {
>
> struct port_attribute {
> struct attribute attr;
> - ssize_t (*show)(struct ib_port *, struct port_attribute *, char *buf);
> - ssize_t (*store)(struct ib_port *, struct port_attribute *,
> + ssize_t (*show)(struct kobject *, struct attribute *, char *buf);
> + ssize_t (*store)(struct kobject *, struct attribute *,
> const char *buf, size_t count);
> };
>
> -#define PORT_ATTR(_name, _mode, _show, _store) \
> -struct port_attribute port_attr_##_name = __ATTR(_name, _mode, _show, _store)
> -
> #define PORT_ATTR_RO(_name) \
> struct port_attribute port_attr_##_name = __ATTR_RO(_name)
>
> @@ -102,12 +99,11 @@ static ssize_t port_attr_show(struct kobject *kobj,
> {
> struct port_attribute *port_attr =
> container_of(attr, struct port_attribute, attr);
> - struct ib_port *p = container_of(kobj, struct ib_port, kobj);
>
> if (!port_attr->show)
> return -EIO;
>
> - return port_attr->show(p, port_attr, buf);
> + return port_attr->show(kobj, attr, buf);
> }
>
> static ssize_t port_attr_store(struct kobject *kobj,
> @@ -116,11 +112,10 @@ static ssize_t port_attr_store(struct kobject *kobj,
> {
> struct port_attribute *port_attr =
> container_of(attr, struct port_attribute, attr);
> - struct ib_port *p = container_of(kobj, struct ib_port, kobj);
>
> if (!port_attr->store)
> return -EIO;
> - return port_attr->store(p, port_attr, buf, count);
> + return port_attr->store(kobj, attr, buf, count);
> }
>
> static const struct sysfs_ops port_sysfs_ops = {
> @@ -133,22 +128,21 @@ static ssize_t gid_attr_show(struct kobject *kobj,
> {
> struct port_attribute *port_attr =
> container_of(attr, struct port_attribute, attr);
> - struct ib_port *p = container_of(kobj, struct gid_attr_group,
> - kobj)->port;
>
> if (!port_attr->show)
> return -EIO;
>
> - return port_attr->show(p, port_attr, buf);
> + return port_attr->show(kobj, attr, buf);
> }
>
> static const struct sysfs_ops gid_attr_sysfs_ops = {
> .show = gid_attr_show
> };
>
> -static ssize_t state_show(struct ib_port *p, struct port_attribute *unused,
> +static ssize_t state_show(struct kobject *kobj, struct attribute *unused,
> char *buf)
> {
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> struct ib_port_attr attr;
> ssize_t ret;
>
> @@ -172,9 +166,10 @@ static ssize_t state_show(struct ib_port *p, struct port_attribute *unused,
> "UNKNOWN");
> }
>
> -static ssize_t lid_show(struct ib_port *p, struct port_attribute *unused,
> +static ssize_t lid_show(struct kobject *kobj, struct attribute *unused,
> char *buf)
> {
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> struct ib_port_attr attr;
> ssize_t ret;
>
> @@ -185,10 +180,11 @@ static ssize_t lid_show(struct ib_port *p, struct port_attribute *unused,
> return sysfs_emit(buf, "0x%x\n", attr.lid);
> }
>
> -static ssize_t lid_mask_count_show(struct ib_port *p,
> - struct port_attribute *unused,
> +static ssize_t lid_mask_count_show(struct kobject *kobj,
> + struct attribute *unused,
> char *buf)
> {
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> struct ib_port_attr attr;
> ssize_t ret;
>
> @@ -199,9 +195,10 @@ static ssize_t lid_mask_count_show(struct ib_port *p,
> return sysfs_emit(buf, "%d\n", attr.lmc);
> }
>
> -static ssize_t sm_lid_show(struct ib_port *p, struct port_attribute *unused,
> +static ssize_t sm_lid_show(struct kobject *kobj, struct attribute *unused,
> char *buf)
> {
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> struct ib_port_attr attr;
> ssize_t ret;
>
> @@ -212,9 +209,10 @@ static ssize_t sm_lid_show(struct ib_port *p, struct port_attribute *unused,
> return sysfs_emit(buf, "0x%x\n", attr.sm_lid);
> }
>
> -static ssize_t sm_sl_show(struct ib_port *p, struct port_attribute *unused,
> +static ssize_t sm_sl_show(struct kobject *kobj, struct attribute *unused,
> char *buf)
> {
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> struct ib_port_attr attr;
> ssize_t ret;
>
> @@ -225,9 +223,10 @@ static ssize_t sm_sl_show(struct ib_port *p, struct port_attribute *unused,
> return sysfs_emit(buf, "%d\n", attr.sm_sl);
> }
>
> -static ssize_t cap_mask_show(struct ib_port *p, struct port_attribute *unused,
> +static ssize_t cap_mask_show(struct kobject *kobj, struct attribute *unused,
> char *buf)
> {
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> struct ib_port_attr attr;
> ssize_t ret;
>
> @@ -238,9 +237,10 @@ static ssize_t cap_mask_show(struct ib_port *p, struct port_attribute *unused,
> return sysfs_emit(buf, "0x%08x\n", attr.port_cap_flags);
> }
>
> -static ssize_t rate_show(struct ib_port *p, struct port_attribute *unused,
> +static ssize_t rate_show(struct kobject *kobj, struct attribute *unused,
> char *buf)
> {
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> struct ib_port_attr attr;
> char *speed = "";
> int rate; /* in deci-Gb/sec */
> @@ -313,9 +313,10 @@ static const char *phys_state_to_str(enum ib_port_phys_state phys_state)
> return "<unknown>";
> }
>
> -static ssize_t phys_state_show(struct ib_port *p, struct port_attribute *unused,
> +static ssize_t phys_state_show(struct kobject *kobj, struct attribute *unused,
> char *buf)
> {
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> struct ib_port_attr attr;
>
> ssize_t ret;
> @@ -328,9 +329,10 @@ static ssize_t phys_state_show(struct ib_port *p, struct port_attribute *unused,
> phys_state_to_str(attr.phys_state));
> }
>
> -static ssize_t link_layer_show(struct ib_port *p, struct port_attribute *unused,
> +static ssize_t link_layer_show(struct kobject *kobj, struct attribute *unused,
> char *buf)
> {
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> const char *output;
>
> switch (rdma_port_get_link_layer(p->ibdev, p->port_num)) {
> @@ -391,11 +393,9 @@ static ssize_t print_gid_type(const struct ib_gid_attr *gid_attr, char *buf)
> }
>
> static ssize_t _show_port_gid_attr(
> - struct ib_port *p, struct port_attribute *attr, char *buf,
> + struct ib_port *p, struct port_table_attribute *tab_attr, char *buf,
> ssize_t (*print)(const struct ib_gid_attr *gid_attr, char *buf))
> {
> - struct port_table_attribute *tab_attr =
> - container_of(attr, struct port_table_attribute, attr);
> const struct ib_gid_attr *gid_attr;
> ssize_t ret;
>
> @@ -409,11 +409,12 @@ static ssize_t _show_port_gid_attr(
> return ret;
> }
>
> -static ssize_t show_port_gid(struct ib_port *p, struct port_attribute *attr,
> +static ssize_t show_port_gid(struct kobject *kobj, struct attribute *attr,
> char *buf)
> {
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> struct port_table_attribute *tab_attr =
> - container_of(attr, struct port_table_attribute, attr);
> + container_of(attr, struct port_table_attribute, attr.attr);
> const struct ib_gid_attr *gid_attr;
> int len;
>
> @@ -438,24 +439,31 @@ static ssize_t show_port_gid(struct ib_port *p, struct port_attribute *attr,
> return len;
> }
>
> -static ssize_t show_port_gid_attr_ndev(struct ib_port *p,
> - struct port_attribute *attr, char *buf)
> +static ssize_t show_port_gid_attr_ndev(struct kobject *kobj,
> + struct attribute *attr, char *buf)
> {
> - return _show_port_gid_attr(p, attr, buf, print_ndev);
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> + struct port_table_attribute *tab_attr =
> + container_of(attr, struct port_table_attribute, attr.attr);
> + return _show_port_gid_attr(p, tab_attr, buf, print_ndev);
> }
>
> -static ssize_t show_port_gid_attr_gid_type(struct ib_port *p,
> - struct port_attribute *attr,
> +static ssize_t show_port_gid_attr_gid_type(struct kobject *kobj,
> + struct attribute *attr,
> char *buf)
> {
> - return _show_port_gid_attr(p, attr, buf, print_gid_type);
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> + struct port_table_attribute *tab_attr =
> + container_of(attr, struct port_table_attribute, attr.attr);
> + return _show_port_gid_attr(p, tab_attr, buf, print_gid_type);
> }
>
> -static ssize_t show_port_pkey(struct ib_port *p, struct port_attribute *attr,
> +static ssize_t show_port_pkey(struct kobject *kobj, struct attribute *attr,
> char *buf)
> {
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> struct port_table_attribute *tab_attr =
> - container_of(attr, struct port_table_attribute, attr);
> + container_of(attr, struct port_table_attribute, attr.attr);
> u16 pkey;
> int ret;
>
> @@ -528,11 +536,12 @@ static int get_perf_mad(struct ib_device *dev, int port_num, __be16 attr,
> return ret;
> }
>
> -static ssize_t show_pma_counter(struct ib_port *p, struct port_attribute *attr,
> +static ssize_t show_pma_counter(struct kobject *kobj, struct attribute *attr,
> char *buf)
> {
> + struct ib_port *p = container_of(kobj, struct ib_port, kobj);
> struct port_table_attribute *tab_attr =
> - container_of(attr, struct port_table_attribute, attr);
> + container_of(attr, struct port_table_attribute, attr.attr);
> int offset = tab_attr->index & 0xffff;
> int width = (tab_attr->index >> 16) & 0xff;
> int ret;
> @@ -745,8 +754,8 @@ static struct kobj_type gid_attr_type = {
> };
>
> static struct attribute **
> -alloc_group_attrs(ssize_t (*show)(struct ib_port *,
> - struct port_attribute *, char *buf),
> +alloc_group_attrs(ssize_t (*show)(struct kobject *,
> + struct attribute *, char *buf),
> int len)
> {
> struct attribute **tab_attr;
>
> --
> Kees Cook