On Thu, Jan 14, 2021 at 12:29:28PM -0500, Brian Foster wrote: > On Thu, Jan 14, 2021 at 05:20:29AM -0500, Yumei Huang wrote: > > Hit the issue when doing syzkaller test with kernel 5.11.0-rc3(65f0d241). The C reproducer is attached. > > > > Steps to Reproduce: > > 1. # gcc -pthread -o reproducer reproducer.c > > 2. # ./reproducer > > > > > > Test results: > > [ 131.726790] XFS: Assertion failed: (iattr->ia_valid & (ATTR_UID|ATTR_GID|ATTR_ATIME|ATTR_ATIME_SET| ATTR_MTIME_SET|ATTR_KILL_PRIV|ATTR_TIMES_SET)) == 0, file: fs/xfs/xfs_iops.c, line: 849 > > [ 131.743687] ------------[ cut here ]------------ > > Some quick initial analysis from a run of the reproducer... It looks > like it calls into xfs_setattr_size() with ATTR_KILL_PRIV set in > ->ia_valid. This appears to originate in the VFS via handle_truncate() > -> do_truncate() -> dentry_needs_remove_privs(). > > An strace of the reproducer shows the following calls: > > ... > [pid 1524] creat("./file0", 010) = 3 > ... > [pid 1524] fsetxattr(3, "security.capability", "\0\0\0\3b\27\0\0\10\0\0\0\2\0\0\0\377\377\377\377\0\356\0", 24, 0 <unfinished ...> > ... > [pid 1524] creat("./file0", 010 <unfinished ...> > ... > > So I'm guessing there's an attempt to open this file with O_TRUNC with > this particular xattr set (unexpectedly?). Indeed, after the reproducer > leaves file01 around with the xattr, a subsequent xfs_io -c "open -t > ..." attempt triggers the assert again, and then the xattr disappears. > I'd have to dig more into the associated vfs code to grok the expected > behavior and whether there's a problem here.. > The reproducer seems to boil down to this: touch <file> setfattr -n security.capability -v 0sAAAAA2IXAAAIAAAAAgAAAP////8A7gAA <file> xfs_io -c "open -t <file>" ... and afaict, the behavior is as expected. do_truncate() sets ATTR_KILL_PRIV via dentry_needs_remove_privs() and calls into notify_change(). That eventually gets to xfs_vn_setattr_size(), which calls xfs_vn_change_ok() -> setattr_prepare(). setattr_prepare() handles ATTR_KILL_PRIV (which remains set in ->ia_valid), and then we return, fall into xfs_setattr_size() and that triggers the assert failure. ISTM we should probably just drop ATTR_KILL_PRIV from the assert. Brian > Brian > > > [ 131.748350] WARNING: CPU: 18 PID: 1786 at fs/xfs/xfs_message.c:97 asswarn+0x1a/0x1d [xfs] > > [ 131.756764] Modules linked in: intel_rapl_msr intel_rapl_common edac_mce_amd kvm_amd rfkill kvm irqbypass mgag200 crct10dif_pclmul i2c_algo_bit drm_kms_helper syscopyarea sysfillrect sysimgblt fb_sys_fops crc32_pclmul ccp sp5100_tco drm ipmi_ssif ses ghash_clmulni_intel pcspkr hpilo acpi_ipmi enclosure hpwdt i2c_piix4 k10temp rapl ipmi_si ipmi_devintf ipmi_msghandler acpi_tad acpi_cpufreq ip_tables xfs libcrc32c sd_mod t10_pi sg uas crc32c_intel serio_raw usb_storage smartpqi scsi_transport_sas tg3 wmi dm_mirror dm_region_hash dm_log dm_mod > > [ 131.805054] CPU: 18 PID: 1786 Comm: reproducer Tainted: G B 5.11.0-rc3upstream65f0d241+ #2 > > [ 131.814702] Hardware name: HPE ProLiant DL385 Gen10/ProLiant DL385 Gen10, BIOS A40 10/14/2017 > > [ 131.823299] RIP: 0010:asswarn+0x1a/0x1d [xfs] > > [ 131.827868] Code: c4 d0 00 00 00 5b 41 5c 41 5d 41 5e 41 5f 5d c3 0f 1f 44 00 00 41 89 c8 48 89 d1 48 89 f2 48 c7 c6 40 d6 ad c0 e8 08 fa ff ff <0f> 0b c3 0f 1f 44 00 00 53 41 89 c8 48 89 d1 48 89 f2 48 c7 c6 40 > > [ 131.846777] RSP: 0018:ffff88812128f828 EFLAGS: 00010282 > > [ 131.852059] RAX: 0000000000000000 RBX: 1ffff11024251f0b RCX: 0000000000000000 > > [ 131.859256] RDX: dffffc0000000000 RSI: 000000000000000a RDI: ffffed1024251ef7 > > [ 131.866458] RBP: ffff88812128f920 R08: ffffed110dcfe24d R09: ffffed110dcfe24d > > [ 131.873663] R10: ffff88886e7f1267 R11: ffffed110dcfe24c R12: ffff88812128fa68 > > [ 131.880862] R13: ffff88819bf08280 R14: ffff88819bf08280 R15: ffff88819bf08000 > > [ 131.888062] FS: 00007f18cb349700(0000) GS:ffff88886e600000(0000) knlGS:0000000000000000 > > [ 131.896222] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 > > [ 131.902026] CR2: 0000000020000100 CR3: 0000000112820000 CR4: 00000000003506e0 > > [ 131.909223] Call Trace: > > [ 131.911703] xfs_setattr_size+0x742/0xd00 [xfs] > > [ 131.916427] ? __vfs_removexattr+0xd1/0x130 > > [ 131.920673] ? xfs_setattr_nonsize+0xef0/0xef0 [xfs] > > [ 131.925836] ? cap_inode_killpriv+0x11/0x20 > > [ 131.930071] ? security_inode_killpriv+0x3f/0x70 > > [ 131.934740] xfs_vn_setattr+0xea/0x3a0 [xfs] > > [ 131.939211] ? xfs_vn_setattr_size+0x2a0/0x2a0 [xfs] > > [ 131.944375] notify_change+0x744/0xda0 > > [ 131.948173] ? do_truncate+0xe2/0x180 > > [ 131.951880] do_truncate+0xe2/0x180 > > [ 131.955412] ? __x64_sys_openat2+0x1c0/0x1c0 > > [ 131.959731] ? ima_file_check+0xd9/0x120 > > [ 131.963701] ? security_inode_permission+0x79/0xc0 > > [ 131.968545] path_openat+0x11df/0x21f0 > > [ 131.972340] ? path_lookupat.isra.48+0x440/0x440 > > [ 131.977012] ? quarantine_put+0xe2/0x170 > > [ 131.980979] ? trace_hardirqs_on+0x1c/0x150 > > [ 131.985211] do_filp_open+0x176/0x250 > > [ 131.988915] ? lock_release+0x56e/0xcc0 > > [ 131.992797] ? may_open_dev+0xc0/0xc0 > > [ 131.996503] ? do_raw_spin_unlock+0x54/0x230 > > [ 132.000827] do_sys_openat2+0x2ee/0x5c0 > > [ 132.004710] ? rcu_read_unlock+0x50/0x50 > > [ 132.008676] ? file_open_root+0x210/0x210 > > [ 132.012732] ? ktime_get_coarse_real_ts64+0x122/0x150 > > [ 132.017840] do_sys_open+0x8a/0xd0 > > [ 132.021284] ? filp_open+0x50/0x50 > > [ 132.024730] ? syscall_trace_enter.isra.16+0x18e/0x250 > > [ 132.029923] do_syscall_64+0x33/0x40 > > [ 132.033543] entry_SYSCALL_64_after_hwframe+0x44/0xa9 > > [ 132.038647] RIP: 0033:0x7f18cac3c51d > > [ 132.042266] Code: 00 c3 66 2e 0f 1f 84 00 00 00 00 00 90 f3 0f 1e fa 48 89 f8 48 89 f7 48 89 d6 48 89 ca 4d 89 c2 4d 89 c8 4c 8b 4c 24 08 0f 05 <48> 3d 01 f0 ff ff 73 01 c3 48 8b 0d 3b 79 2c 00 f7 d8 64 89 01 48 > > [ 132.061173] RSP: 002b:00007f18cb348e98 EFLAGS: 00000246 ORIG_RAX: 0000000000000055 > > [ 132.068817] RAX: ffffffffffffffda RBX: 0000000000000000 RCX: 00007f18cac3c51d > > [ 132.076013] RDX: 0030656c69662f2e RSI: 0000000000000008 RDI: 0000000020000100 > > [ 132.083209] RBP: 00007f18cb348ec0 R08: 0000000000000000 R09: 0000000000000000 > > [ 132.090407] R10: 0000000000000000 R11: 0000000000000246 R12: 00007fff50ae2e4e > > [ 132.097607] R13: 00007fff50ae2e4f R14: 00007fff50ae2ee0 R15: 00007f18cb348fc0 > > [ 132.104812] irq event stamp: 0 > > [ 132.107902] hardirqs last enabled at (0): [<0000000000000000>] 0x0 > > [ 132.114228] hardirqs last disabled at (0): [<ffffffff9c1ce85b>] copy_process+0x1a7b/0x6590 > > [ 132.122570] softirqs last enabled at (0): [<ffffffff9c1ce89f>] copy_process+0x1abf/0x6590 > > [ 132.130905] softirqs last disabled at (0): [<0000000000000000>] 0x0 > > [ 132.137235] ---[ end trace d05db93236ee9da5 ]--- > > > > > > Syzkaller reproducer: > > # {Threaded:true Collide:true Repeat:false RepeatTimes:0 Procs:1 Slowdown:1 Sandbox: Fault:false FaultCall:-1 FaultNth:0 Leak:false NetInjection:false NetDevices:false NetReset:false Cgroups:false BinfmtMisc:false CloseFDs:false KCSAN:false DevlinkPCI:false USB:false VhciInjection:false Wifi:false Sysctl:false UseTmpDir:false HandleSegv:false Repro:false Trace:false} > > r0 = creat(&(0x7f0000000100)='./file0\x00', 0x8) > > fsetxattr$security_capability(r0, &(0x7f0000000280)='security.capability\x00', &(0x7f00000002c0)=@v3={0x3000000, [{0x1762, 0x8}, {0x2, 0xffffffff}], 0xee00}, 0x18, 0x0) > > > > > > > > Best Regards, > > > > Yumei Huang > > > > > // autogenerated by syzkaller (https://github.com/google/syzkaller) > > > > #define _GNU_SOURCE > > > > #include <endian.h> > > #include <errno.h> > > #include <pthread.h> > > #include <stdint.h> > > #include <stdio.h> > > #include <stdlib.h> > > #include <string.h> > > #include <sys/syscall.h> > > #include <sys/types.h> > > #include <time.h> > > #include <unistd.h> > > > > #include <linux/futex.h> > > > > static void sleep_ms(uint64_t ms) > > { > > usleep(ms * 1000); > > } > > > > static uint64_t current_time_ms(void) > > { > > struct timespec ts; > > if (clock_gettime(CLOCK_MONOTONIC, &ts)) > > exit(1); > > return (uint64_t)ts.tv_sec * 1000 + (uint64_t)ts.tv_nsec / 1000000; > > } > > > > static void thread_start(void* (*fn)(void*), void* arg) > > { > > pthread_t th; > > pthread_attr_t attr; > > pthread_attr_init(&attr); > > pthread_attr_setstacksize(&attr, 128 << 10); > > int i = 0; > > for (; i < 100; i++) { > > if (pthread_create(&th, &attr, fn, arg) == 0) { > > pthread_attr_destroy(&attr); > > return; > > } > > if (errno == EAGAIN) { > > usleep(50); > > continue; > > } > > break; > > } > > exit(1); > > } > > > > typedef struct { > > int state; > > } event_t; > > > > static void event_init(event_t* ev) > > { > > ev->state = 0; > > } > > > > static void event_reset(event_t* ev) > > { > > ev->state = 0; > > } > > > > static void event_set(event_t* ev) > > { > > if (ev->state) > > exit(1); > > __atomic_store_n(&ev->state, 1, __ATOMIC_RELEASE); > > syscall(SYS_futex, &ev->state, FUTEX_WAKE | FUTEX_PRIVATE_FLAG, 1000000); > > } > > > > static void event_wait(event_t* ev) > > { > > while (!__atomic_load_n(&ev->state, __ATOMIC_ACQUIRE)) > > syscall(SYS_futex, &ev->state, FUTEX_WAIT | FUTEX_PRIVATE_FLAG, 0, 0); > > } > > > > static int event_isset(event_t* ev) > > { > > return __atomic_load_n(&ev->state, __ATOMIC_ACQUIRE); > > } > > > > static int event_timedwait(event_t* ev, uint64_t timeout) > > { > > uint64_t start = current_time_ms(); > > uint64_t now = start; > > for (;;) { > > uint64_t remain = timeout - (now - start); > > struct timespec ts; > > ts.tv_sec = remain / 1000; > > ts.tv_nsec = (remain % 1000) * 1000 * 1000; > > syscall(SYS_futex, &ev->state, FUTEX_WAIT | FUTEX_PRIVATE_FLAG, 0, &ts); > > if (__atomic_load_n(&ev->state, __ATOMIC_ACQUIRE)) > > return 1; > > now = current_time_ms(); > > if (now - start > timeout) > > return 0; > > } > > } > > > > struct thread_t { > > int created, call; > > event_t ready, done; > > }; > > > > static struct thread_t threads[16]; > > static void execute_call(int call); > > static int running; > > > > static void* thr(void* arg) > > { > > struct thread_t* th = (struct thread_t*)arg; > > for (;;) { > > event_wait(&th->ready); > > event_reset(&th->ready); > > execute_call(th->call); > > __atomic_fetch_sub(&running, 1, __ATOMIC_RELAXED); > > event_set(&th->done); > > } > > return 0; > > } > > > > static void loop(void) > > { > > int i, call, thread; > > int collide = 0; > > again: > > for (call = 0; call < 2; call++) { > > for (thread = 0; thread < (int)(sizeof(threads) / sizeof(threads[0])); thread++) { > > struct thread_t* th = &threads[thread]; > > if (!th->created) { > > th->created = 1; > > event_init(&th->ready); > > event_init(&th->done); > > event_set(&th->done); > > thread_start(thr, th); > > } > > if (!event_isset(&th->done)) > > continue; > > event_reset(&th->done); > > th->call = call; > > __atomic_fetch_add(&running, 1, __ATOMIC_RELAXED); > > event_set(&th->ready); > > if (collide && (call % 2) == 0) > > break; > > event_timedwait(&th->done, 50); > > break; > > } > > } > > for (i = 0; i < 100 && __atomic_load_n(&running, __ATOMIC_RELAXED); i++) > > sleep_ms(1); > > if (!collide) { > > collide = 1; > > goto again; > > } > > } > > > > uint64_t r[1] = {0xffffffffffffffff}; > > > > void execute_call(int call) > > { > > intptr_t res = 0; > > switch (call) { > > case 0: > > memcpy((void*)0x20000100, "./file0\000", 8); > > res = syscall(__NR_creat, 0x20000100ul, 8ul); > > if (res != -1) > > r[0] = res; > > break; > > case 1: > > memcpy((void*)0x20000280, "security.capability\000", 20); > > *(uint32_t*)0x200002c0 = 0x3000000; > > *(uint32_t*)0x200002c4 = 0x1762; > > *(uint32_t*)0x200002c8 = 8; > > *(uint32_t*)0x200002cc = 2; > > *(uint32_t*)0x200002d0 = -1; > > *(uint32_t*)0x200002d4 = 0xee00; > > syscall(__NR_fsetxattr, r[0], 0x20000280ul, 0x200002c0ul, 0x18ul, 0ul); > > break; > > } > > > > } > > int main(void) > > { > > syscall(__NR_mmap, 0x1ffff000ul, 0x1000ul, 0ul, 0x32ul, -1, 0ul); > > syscall(__NR_mmap, 0x20000000ul, 0x1000000ul, 7ul, 0x32ul, -1, 0ul); > > syscall(__NR_mmap, 0x21000000ul, 0x1000ul, 0ul, 0x32ul, -1, 0ul); > > loop(); > > return 0; > > } >