本文为一个新手阅读ksu源码过程中的随笔，不足之处还请纠正

KernelSU 基于commit：cf0bb45f6b1b5275c040ff980e56cd630707cd04 (tag: v3.0.0)

‍

思维导图

KernelSU#

kernel部分#

各模块分析#

allowlist#

1
#ifndef __KSU_H_ALLOWLIST
2
#define __KSU_H_ALLOWLIST
3

4
#include <linux/types.h>
5
#include <linux/uidgid.h>
6
#include "app_profile.h"
7

8
#define PER_USER_RANGE 100000
9
#define FIRST_APPLICATION_UID 10000
10
#define LAST_APPLICATION_UID 19999
11
#define FIRST_ISOLATED_UID 99000
12
#define LAST_ISOLATED_UID 99999
13

14
void ksu_allowlist_init(void);//初始化allowlist链表
15

16
void ksu_allowlist_exit(void);//清理allowlist链表
17

18
void ksu_load_allow_list(void);//加载allowlist文件到链表，路径：/data/adb/ksu/.allowlist
19

20
void ksu_show_allow_list(void);//打印allowlist链表内容到日志
21

22
// Check if the uid is in allow list
23
bool __ksu_is_allow_uid(uid_t uid);
24
#define ksu_is_allow_uid(uid) unlikely(__ksu_is_allow_uid(uid))
25

26
// Check if the uid is in allow list, or current is ksu domain root
27
bool __ksu_is_allow_uid_for_current(uid_t uid);
28
#define ksu_is_allow_uid_for_current(uid) unlikely(__ksu_is_allow_uid_for_current(uid))
29

30
bool ksu_get_allow_list(int *array, int *length, bool allow);
31

32
void ksu_prune_allowlist(bool (*is_uid_exist)(uid_t, char *, void *), void *data);//清理无用的allowlist条目
33

34
bool ksu_get_app_profile(struct app_profile *);//获取指定uid的app profile
35
bool ksu_set_app_profile(struct app_profile *, bool persist);//设置指定uid的app profile
36

37
bool ksu_uid_should_umount(uid_t uid);//是否执行umount操作
38
struct root_profile *ksu_get_root_profile(uid_t uid);//获取授予root权限的app的app profile
39

40
static inline bool is_appuid(uid_t uid)
41
{
42
    uid_t appid = uid % PER_USER_RANGE;
43
    return appid >= FIRST_APPLICATION_UID && appid <= LAST_APPLICATION_UID;
44
}
45

46
static inline bool is_isolated_process(uid_t uid)
47
{
48
    uid_t appid = uid % PER_USER_RANGE;
49
    return appid >= FIRST_ISOLATED_UID && appid <= LAST_ISOLATED_UID;
50
}
51
#endif

这个模块是ksu权限管理的核心，实现了allow_list的管理

这之中主要使用了三种数据结构

1
struct perm_data {
2
    struct list_head list;
3
    struct app_profile profile;
4
};
5
static struct list_head allow_list;
6

7
static uint8_t allow_list_bitmap[PAGE_SIZE] __read_mostly __aligned(PAGE_SIZE);
8

9
static int allow_list_arr[PAGE_SIZE / sizeof(int)] __read_mostly;

数据结构	作用	特点
`allow_list_bitmap`	位图缓存。专门用于 UID < 32768 的普通应用。	查询速度 O(1) 。
`allow_list_arr`	数组缓存。专门用于 UID ≥ 32768 的特殊应用（如多用户分身）。	查询速度 O(n) 。弥补位图范围的不足。
`allow_list`(链表)	完整数据库。存储所有的`app_profile`配置细节。	查询速度 O(n) 。存储全量信息。包含 UID、包名、SELinux 域、Capabilities 等所有细节。

前两者用于快速判定某个uid是否被manager配置（su, app_profile, umount）

allow_list这个链表存储了完整的app_profile信息，供其他模块调用获取某个uid的配置信息

app_sign#

1
#ifndef __KSU_H_APK_V2_SIGN
2
#define __KSU_H_APK_V2_SIGN
3

4
#include <linux/types.h>
5

6
bool is_manager_apk(char *path);
7

8
#endif

只有一个功能，根据传入的apk来判断其是否为官方manager

1
bool is_manager_apk(char *path)
2
{
3
    return check_v2_signature(path, EXPECTED_SIZE, EXPECTED_HASH);
4
}

1
static __always_inline bool check_v2_signature(char *path,
2
                           unsigned expected_size,
3
                           const char *expected_sha256)
4
{
5
    unsigned char buffer[0x11] = { 0 };
6
    u32 size4;
7
    u64 size8, size_of_block;
8

9
    loff_t pos;
10

11
    bool v2_signing_valid = false;
12
    int v2_signing_blocks = 0;
13
    bool v3_signing_exist = false;
14
    bool v3_1_signing_exist = false;
15
  /*
16
    ............
17
  */
18

19
    if (v2_signing_valid) {
20
        int has_v1_signing = has_v1_signature_file(fp);
21
        if (has_v1_signing) {
22
            pr_err("Unexpected v1 signature scheme found!\n");
23
            filp_close(fp, 0);
24
            return false;
25
        }
26
    }
27
clean:
28
    filp_close(fp, 0);
29

30
    if (v3_signing_exist || v3_1_signing_exist) {
31
#ifdef CONFIG_KSU_DEBUG
32
        pr_err("Unexpected v3 signature scheme found!\n");
33
#endif
34
        return false;
35
    }
36

37
    return v2_signing_valid;
38
}

仅允许v2签名存在，v1/v3/v3.1均会直接返回false

app_profile#

1
#ifndef __KSU_H_APP_PROFILE
2
#define __KSU_H_APP_PROFILE
3

4
#include <linux/types.h>
5

6
// Forward declarations
7
struct cred;
8

9
#define KSU_APP_PROFILE_VER 2
10
#define KSU_MAX_PACKAGE_NAME 256
11
// NGROUPS_MAX for Linux is 65535 generally, but we only supports 32 groups.
12
#define KSU_MAX_GROUPS 32
13
#define KSU_SELINUX_DOMAIN 64
14

15
struct root_profile {
16
  int32_t uid;
17
  int32_t gid;
18

19
  int32_t groups_count;
20
  int32_t groups[KSU_MAX_GROUPS];
21

22
  // kernel_cap_t is u32[2] for capabilities v3
23
  struct {
24
    u64 effective;
25
    u64 permitted;
26
    u64 inheritable;
27
  } capabilities;
28

29
  char selinux_domain[KSU_SELINUX_DOMAIN];
30

31
  int32_t namespaces;
32
};
33

34
struct non_root_profile {
35
  bool umount_modules;
36
};
37

38
struct app_profile {
39
  // It may be utilized for backward compatibility, although we have never explicitly made any promises regarding this.
40
  u32 version;
41

42
  // this is usually the package of the app, but can be other value for special apps
43
  char key[KSU_MAX_PACKAGE_NAME];
44
  int32_t current_uid;
45
  bool allow_su;
46

47
  union {
48
    struct {
49
      bool use_default;
50
      char template_name[KSU_MAX_PACKAGE_NAME];
51

52
      struct root_profile profile;
53
    } rp_config;
54

55
    struct {
56
      bool use_default;
57

58
      struct non_root_profile profile;
59
    } nrp_config;
60
  };
61
};
62

63
// Escalate current process to root with the appropriate profile
64
void escape_with_root_profile(void);
65

66
#endif

只有一个功能，将当前进程提权到 app_profile 中定义的权限

1
void escape_with_root_profile(void)
2
{
3
  struct cred *cred;
4
  struct task_struct *p = current;
5
  struct task_struct *t;
6

7
  cred = prepare_creds();
8
  if (!cred) {
9
    pr_warn("prepare_creds failed!\n");
10
    return;
11
  }
12

13
  if (cred->euid.val == 0) {
14
    pr_warn("Already root, don't escape!\n");
15
    abort_creds(cred);
16
    return;
17
  }
18

19
  struct root_profile *profile = ksu_get_root_profile(cred->uid.val);
20

21
  cred->uid.val = profile->uid;
22
  cred->suid.val = profile->uid;
23
  cred->euid.val = profile->uid;
24
  cred->fsuid.val = profile->uid;
25

26
  cred->gid.val = profile->gid;
27
  cred->fsgid.val = profile->gid;
28
  cred->sgid.val = profile->gid;
29
  cred->egid.val = profile->gid;
30
  cred->securebits = 0;
31

32
  BUILD_BUG_ON(sizeof(profile->capabilities.effective) !=
33
         sizeof(kernel_cap_t));
34

35
  // setup capabilities
36
  // we need CAP_DAC_READ_SEARCH becuase `/data/adb/ksud` is not accessible for non root process
37
  // we add it here but don't add it to cap_inhertiable, it would be dropped automaticly after exec!
38
  u64 cap_for_ksud = profile->capabilities.effective | CAP_DAC_READ_SEARCH;
39
  memcpy(&cred->cap_effective, &cap_for_ksud, sizeof(cred->cap_effective));
40
  memcpy(&cred->cap_permitted, &profile->capabilities.effective,
41
         sizeof(cred->cap_permitted));
42
  memcpy(&cred->cap_bset, &profile->capabilities.effective,
43
         sizeof(cred->cap_bset));
44

45
  setup_groups(profile, cred);
46

47
  commit_creds(cred);
48

49
  // Refer to kernel/seccomp.c: seccomp_set_mode_strict
50
  // When disabling Seccomp, ensure that current->sighand->siglock is held during the operation.
51
  spin_lock_irq(&current->sighand->siglock);
52
  disable_seccomp();
53
  spin_unlock_irq(&current->sighand->siglock);
54

55
  setup_selinux(profile->selinux_domain);
56

57
  for_each_thread (p, t) {
58
    ksu_set_task_tracepoint_flag(t);
59
  }
60
}

这实际上突破了三种限制：传统 Linux 权限、Seccomp 和 SELinux

传统linux权限#

设置uid / gid / group#

User identifier

设置为profile中定义的uid gid group

设置capabilities#

linux 安全特性 capability 能力级

设置为profile中定义的capabilities

这里有一处值得注意的地方：

1
  // we need CAP_DAC_READ_SEARCH becuase `/data/adb/ksud` is not accessible for non root process
2
  // we add it here but don't add it to cap_inhertiable, it would be dropped automaticly after exec!
3
  u64 cap_for_ksud = profile->capabilities.effective | CAP_DAC_READ_SEARCH;
4
  memcpy(&cred->cap_effective, &cap_for_ksud, sizeof(cred->cap_effective));

cap_dac_read_search 功能可让用户读取文件系统中的任意文件，包括 root 拥有的所有文件。

并且这里没有把 cap_dac_read_search 加入 cap_inheritable（可继承集合），这使得进程在运行 ksud 后即刻失去了 cap_dac_read_search 能力

为什么要给进程添加`cap_dac_read_search` 能力？#

实际上 ksu hook了execve 这个系统调用，重定向 su 和 /system/bin/su 命令到了 /data/adb/ksud

而 ksu 引入了 app_profile 机制，提权后并不一定是root进程，所以必须添加 cap_dac_read_search 能力保证执行su的进程均能访问到/data/adb/ksud

详见syscall_hook_manager模块

Seccomp#

1
static void disable_seccomp(void)
2
{
3
  assert_spin_locked(&current->sighand->siglock);
4
  // disable seccomp
5
#if defined(CONFIG_GENERIC_ENTRY) &&                                           \
6
  LINUX_VERSION_CODE >= KERNEL_VERSION(5, 11, 0)
7
  clear_syscall_work(SECCOMP);
8
#else
9
  clear_thread_flag(TIF_SECCOMP);
10
#endif
11

12
#ifdef CONFIG_SECCOMP
13
  current->seccomp.mode = 0;
14
  current->seccomp.filter = NULL;
15
  atomic_set(&current->seccomp.filter_count, 0);
16
#else
17
#endif
18
}

清除seccomp标志位并且直接关闭当前进程的seccomp

SELinux#

调用 setup_selinux 更改domain

详见selinux

feature#

1
#ifndef __KSU_H_FEATURE
2
#define __KSU_H_FEATURE
3

4
#include <linux/types.h>
5

6
enum ksu_feature_id {
7
    KSU_FEATURE_SU_COMPAT = 0,
8
    KSU_FEATURE_KERNEL_UMOUNT = 1,
9
    KSU_FEATURE_ENHANCED_SECURITY = 2,
10

11
    KSU_FEATURE_MAX
12
};
13

14
typedef int (*ksu_feature_get_t)(u64 *value);
15
typedef int (*ksu_feature_set_t)(u64 value);
16

17
struct ksu_feature_handler {
18
    u32 feature_id;
19
    const char *name;
20
    ksu_feature_get_t get_handler;
21
    ksu_feature_set_t set_handler;
22
};
23
//注册功能
24
int ksu_register_feature_handler(const struct ksu_feature_handler *handler);
25
//注销功能
26
int ksu_unregister_feature_handler(u32 feature_id);
27
//获取功能状态
28
int ksu_get_feature(u32 feature_id, u64 *value, bool *supported);
29
//设置功能状态
30
int ksu_set_feature(u32 feature_id, u64 value);
31

32
void ksu_feature_init(void);
33

34
void ksu_feature_exit(void);
35

36
#endif // __KSU_H_FEATURE

这个模块实现了一个可拓展的功能管理框架

目前有三个功能：

Su兼容模式 -> sucompat模块

内核umount -> kernel_umount模块

增强安全性 -> setuid_hook模块

‍

manager 通过 ioctl 调用 get_feature 和 set_feature，以查询和控制功能是否开启

详见supercalls模块

kernel_umount#

直接看功能实现函数

1
int ksu_handle_umount(uid_t old_uid, uid_t new_uid)
2
{
3
    struct umount_tw *tw;
4

5
    // if there isn't any module mounted, just ignore it!
6
    if (!ksu_module_mounted) {
7
        return 0;
8
    }
9

10
    if (!ksu_kernel_umount_enabled) {
11
        return 0;
12
    }
13

14
    // There are 5 scenarios:
15
    // 1. Normal app: zygote -> appuid
16
    // 2. Isolated process forked from zygote: zygote -> isolated_process
17
    // 3. App zygote forked from zygote: zygote -> appuid
18
    // 4. Isolated process froked from app zygote: appuid -> isolated_process (already handled by 3)
19
    // 5. Isolated process froked from webview zygote (no need to handle, app cannot run custom code)
20
    if (!is_appuid(new_uid) && !is_isolated_process(new_uid)) {
21
        return 0;
22
    }
23

24
    if (!ksu_uid_should_umount(new_uid) && !is_isolated_process(new_uid)) {
25
        return 0;
26
    }
27

28
    // check old process's selinux context, if it is not zygote, ignore it!
29
    // because some su apps may setuid to untrusted_app but they are in global mount namespace
30
    // when we umount for such process, that is a disaster!
31
    // also handle case 4 and 5
32
    bool is_zygote_child = is_zygote(get_current_cred());
33
    if (!is_zygote_child) {
34
        pr_info("handle umount ignore non zygote child: %d\n", current->pid);
35
        return 0;
36
    }
37
    // umount the target mnt
38
    pr_info("handle umount for uid: %d, pid: %d\n", new_uid, current->pid);
39

40
    tw = kzalloc(sizeof(*tw), GFP_ATOMIC);
41
    if (!tw)
42
        return 0;
43

44
    tw->old_cred = get_current_cred();
45
    tw->cb.func = umount_tw_func;
46

47
    int err = task_work_add(current, &tw->cb, TWA_RESUME);
48
    if (err) {
49
        if (tw->old_cred) {
50
            put_cred(tw->old_cred);
51
        }
52
        kfree(tw);
53
        pr_warn("unmount add task_work failed\n");
54
    }
55

56
    return 0;
57
}

这个函数在setuid这个系统调用被触发后调用，详见 setuid_hook 模块

注释列出了5种情形，其中只需要处理1、2、3三种即可

这里其实有一个问题， task_work_add 添加的回调，会在返回用户态前再执行，也就是说在这个回调被执行时，setuid系统调用已经执行完成

而在zygote孵化子进程的核心函数 SpecializeCommon中

注释说，在setuid的系统调用后，进程的权能将被清空

而进行 mount/umount 需要 CAP_SYS_ADMIN 这个权能

所以此时其实是没办法进行mount/umount操作的

1
static void umount_tw_func(struct callback_head *cb)
2
{
3
    struct umount_tw *tw = container_of(cb, struct umount_tw, cb);
4
    const struct cred *saved = NULL;
5
    if (tw->old_cred) {
6
        saved = override_creds(tw->old_cred);
7
    }
8

9
    struct mount_entry *entry;
10
    down_read(&mount_list_lock);
11
    list_for_each_entry(entry, &mount_list, list) {
12
        pr_info("%s: unmounting: %s flags 0x%x\n", __func__, entry->umountable, entry->flags);
13
        try_umount(entry->umountable, entry->flags);
14
    }
15
    up_read(&mount_list_lock);
16

17
    if (saved)
18
        revert_creds(saved);
19

20
    if (tw->old_cred)
21
        put_cred(tw->old_cred);
22

23
    kfree(tw);
24
}

所以 ksu 提前备份了 setuid 之前的 cred，在执行 umount 前用它临时覆盖当前 cred，执行完 umount 操作后再恢复原来的 cred

这样就确保了能够正常进行umount操作

ksu#

1
#include <linux/export.h>
2
#include <linux/fs.h>
3
#include <linux/kobject.h>
4
#include <linux/module.h>
5
#include <linux/workqueue.h>
6

7
#include "allowlist.h"
8
#include "feature.h"
9
#include "klog.h" // IWYU pragma: keep
10
#include "throne_tracker.h"
11
#include "syscall_hook_manager.h"
12
#include "ksud.h"
13
#include "supercalls.h"
14

15
int __init kernelsu_init(void)
16
{
17
#ifdef CONFIG_KSU_DEBUG
18
    pr_alert("*************************************************************");
19
    pr_alert("**     NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE    **");
20
    pr_alert("**                                                         **");
21
    pr_alert("**         You are running KernelSU in DEBUG mode          **");
22
    pr_alert("**                                                         **");
23
    pr_alert("**     NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE    **");
24
    pr_alert("*************************************************************");
25
#endif
26

27
    ksu_feature_init();
28

29
    ksu_supercalls_init();
30

31
    ksu_syscall_hook_manager_init();
32

33
    ksu_allowlist_init();
34

35
    ksu_throne_tracker_init();
36

37
    ksu_ksud_init();
38

39
#ifdef MODULE
40
#ifndef CONFIG_KSU_DEBUG
41
    kobject_del(&THIS_MODULE->mkobj.kobj);
42
#endif
43
#endif
44
    return 0;
45
}
46

47
extern void ksu_observer_exit(void);
48
void kernelsu_exit(void)
49
{
50
    ksu_allowlist_exit();
51

52
    ksu_throne_tracker_exit();
53

54
    ksu_observer_exit();
55

56
    ksu_ksud_exit();
57

58
    ksu_syscall_hook_manager_exit();
59

60
    ksu_supercalls_exit();
61

62
    ksu_feature_exit();
63
}
64

65
module_init(kernelsu_init);
66
module_exit(kernelsu_exit);
67

68
MODULE_LICENSE("GPL");
69
MODULE_AUTHOR("weishu");
70
MODULE_DESCRIPTION("Android KernelSU");
71
#if LINUX_VERSION_CODE >= KERNEL_VERSION(6, 13, 0)
72
MODULE_IMPORT_NS("VFS_internal_I_am_really_a_filesystem_and_am_NOT_a_driver");
73
#else
74
MODULE_IMPORT_NS(VFS_internal_I_am_really_a_filesystem_and_am_NOT_a_driver);
75
#endif

整个内核模块的入口和出口

1
#ifdef MODULE
2
#ifndef CONFIG_KSU_DEBUG
3
    kobject_del(&THIS_MODULE->mkobj.kobj);
4
#endif
5
#endif

隐藏自身内核模块

ksud#

1
#ifndef __KSU_H_KSUD
2
#define __KSU_H_KSUD
3

4
#include <linux/types.h>
5

6
#define KSUD_PATH "/data/adb/ksud"
7

8
void ksu_ksud_init();
9
void ksu_ksud_exit();
10

11
void on_post_fs_data(void);
12
void on_module_mounted(void);
13
void on_boot_completed(void);
14

15
bool ksu_is_safe_mode(void);
16

17
int nuke_ext4_sysfs(const char* mnt);
18

19
extern u32 ksu_file_sid;
20
extern bool ksu_module_mounted;
21
extern bool ksu_boot_completed;
22

23
#endif

主要实现了三类功能

init进程监控#

1
// IMPORTANT NOTE: the call from execve_handler_pre WON'T provided correct value for envp and flags in GKI version
2
int ksu_handle_execveat_ksud(int *fd, struct filename **filename_ptr,
3
                             struct user_arg_ptr *argv,
4
                             struct user_arg_ptr *envp, int *flags)
5
{
6
    struct filename *filename;
7

8
    static const char app_process[] = "/system/bin/app_process";
9
    static bool first_app_process = true;
10

11
    /* This applies to versions Android 10+ */
12
    static const char system_bin_init[] = "/system/bin/init";
13
    /* This applies to versions between Android 6 ~ 9  */
14
    static const char old_system_init[] = "/init";
15
    static bool init_second_stage_executed = false;
16

17
    if (!filename_ptr)
18
        return 0;
19

20
    filename = *filename_ptr;
21
    if (IS_ERR(filename)) {
22
        return 0;
23
    }
24

25
    if (unlikely(!memcmp(filename->name, system_bin_init,
26
                         sizeof(system_bin_init) - 1) &&
27
                 argv)) {
28
        // /system/bin/init executed
29
        int argc = count(*argv, MAX_ARG_STRINGS);
30
        pr_info("/system/bin/init argc: %d\n", argc);
31
        if (argc > 1 && !init_second_stage_executed) {
32
            const char __user *p = get_user_arg_ptr(*argv, 1);
33
            if (p && !IS_ERR(p)) {
34
                char first_arg[16];
35
                strncpy_from_user_nofault(first_arg, p, sizeof(first_arg));
36
                pr_info("/system/bin/init first arg: %s\n", first_arg);
37
                if (!strcmp(first_arg, "second_stage")) {
38
                    pr_info("/system/bin/init second_stage executed\n");
39
                    apply_kernelsu_rules();
40
                    init_second_stage_executed = true;
41
                }
42
            } else {
43
                pr_err("/system/bin/init parse args err!\n");
44
            }
45
        }
46
    } else if (unlikely(!memcmp(filename->name, old_system_init,
47
                                sizeof(old_system_init) - 1) &&
48
                        argv)) {
49
        // /init executed
50
        int argc = count(*argv, MAX_ARG_STRINGS);
51
        pr_info("/init argc: %d\n", argc);
52
        if (argc > 1 && !init_second_stage_executed) {
53
            /* This applies to versions between Android 6 ~ 7 */
54
            const char __user *p = get_user_arg_ptr(*argv, 1);
55
            if (p && !IS_ERR(p)) {
56
                char first_arg[16];
57
                strncpy_from_user_nofault(first_arg, p, sizeof(first_arg));
58
                pr_info("/init first arg: %s\n", first_arg);
59
                if (!strcmp(first_arg, "--second-stage")) {
60
                    pr_info("/init second_stage executed\n");
61
                    apply_kernelsu_rules();
62
                    init_second_stage_executed = true;
63
                }
64
            } else {
65
                pr_err("/init parse args err!\n");
66
            }
67
        } else if (argc == 1 && !init_second_stage_executed && envp) {
68
            /* This applies to versions between Android 8 ~ 9  */
69
            int envc = count(*envp, MAX_ARG_STRINGS);
70
            if (envc > 0) {
71
                int n;
72
                for (n = 1; n <= envc; n++) {
73
                    const char __user *p = get_user_arg_ptr(*envp, n);
74
                    if (!p || IS_ERR(p)) {
75
                        continue;
76
                    }
77
                    char env[256];
78
                    // Reading environment variable strings from user space
79
                    if (strncpy_from_user_nofault(env, p, sizeof(env)) < 0)
80
                        continue;
81
                    // Parsing environment variable names and values
82
                    char *env_name = env;
83
                    char *env_value = strchr(env, '=');
84
                    if (env_value == NULL)
85
                        continue;
86
                    // Replace equal sign with string terminator
87
                    *env_value = '\0';
88
                    env_value++;
89
                    // Check if the environment variable name and value are matching
90
                    if (!strcmp(env_name, "INIT_SECOND_STAGE") &&
91
                        (!strcmp(env_value, "1") ||
92
                         !strcmp(env_value, "true"))) {
93
                        pr_info("/init second_stage executed\n");
94
                        apply_kernelsu_rules();
95
                        init_second_stage_executed = true;
96
                    }
97
                }
98
            }
99
        }
100
    }
101

102
    if (unlikely(first_app_process && !memcmp(filename->name, app_process,
103
                                              sizeof(app_process) - 1))) {
104
        first_app_process = false;
105
        pr_info("exec app_process, /data prepared, second_stage: %d\n",
106
                init_second_stage_executed);
107
        struct task_struct *init_task;
108
        rcu_read_lock();
109
        init_task = rcu_dereference(current->real_parent);
110
        if (init_task) {
111
            task_work_add(init_task, &on_post_fs_data_cb, TWA_RESUME);
112
        }
113
        rcu_read_unlock();
114

115
        stop_execve_hook();
116
    }
117

118
    return 0;
119
}
120

121
static int sys_execve_handler_pre(struct kprobe *p, struct pt_regs *regs)
122
{
123
    struct pt_regs *real_regs = PT_REAL_REGS(regs);
124
    const char __user **filename_user =
125
        (const char **)&PT_REGS_PARM1(real_regs);
126
    const char __user *const __user *__argv =
127
        (const char __user *const __user *)PT_REGS_PARM2(real_regs);
128
    struct user_arg_ptr argv = { .ptr.native = __argv };
129
    struct filename filename_in, *filename_p;
130
    char path[32];
131
    long ret;
132
    unsigned long addr;
133
    const char __user *fn;
134

135
    if (!filename_user)
136
        return 0;
137

138
    addr = untagged_addr((unsigned long)*filename_user);
139
    fn = (const char __user *)addr;
140

141
    memset(path, 0, sizeof(path));
142
    ret = strncpy_from_user_nofault(path, fn, 32);
143
    if (ret < 0 && try_set_access_flag(addr)) {
144
        ret = strncpy_from_user_nofault(path, fn, 32);
145
    }
146
    if (ret < 0) {
147
        pr_err("Access filename failed for execve_handler_pre\n");
148
        return 0;
149
    }
150
    filename_in.name = path;
151

152
    filename_p = &filename_in;
153
    return ksu_handle_execveat_ksud(AT_FDCWD, &filename_p, &argv, NULL, NULL);
154
}

ksu hook了sys_execve 这个系统调用

‍

当执行init第二阶段时调用 apply_kernelsu_rules 来添加ksu自带的SELinux规则，详见SELinux模块

当第一次执行到 app_process 时，说明 init 的早期启动阶段已完成、/data 已准备就绪，

此时调用on_post_fs_data 并且停止hook sys_execve

1
void on_post_fs_data(void)
2
{
3
    static bool done = false;
4
    if (done) {
5
        pr_info("on_post_fs_data already done\n");
6
        return;
7
    }
8
    done = true;
9
    pr_info("on_post_fs_data!\n");
10
    ksu_load_allow_list();//加载ksu的配置列表
11
    ksu_observer_init();//开始监控manager是否存在
12
    // sanity check, this may influence the performance
13
    stop_input_hook();//停止安全模式按键监控
14

15
    ksu_file_sid = ksu_get_ksu_file_sid();
16
    pr_info("ksu_file sid: %d\n", ksu_file_sid);
17
}

ksud启动#

1
static int ksu_handle_vfs_read(struct file **file_ptr, char __user **buf_ptr,
2
                               size_t *count_ptr, loff_t **pos)
3
{
4
    struct file *file;
5
    char __user *buf;
6
    size_t count;
7

8
    if (strcmp(current->comm, "init")) {
9
        // we are only interest in `init` process
10
        return 0;
11
    }
12

13
    file = *file_ptr;
14
    if (IS_ERR(file)) {
15
        return 0;
16
    }
17

18
    if (!d_is_reg(file->f_path.dentry)) {
19
        return 0;
20
    }
21

22
    const char *short_name = file->f_path.dentry->d_name.name;
23
    if (strcmp(short_name, "atrace.rc")) {
24
        // we are only interest `atrace.rc` file name file
25
        return 0;
26
    }
27
    char path[256];
28
    char *dpath = d_path(&file->f_path, path, sizeof(path));
29

30
    if (IS_ERR(dpath)) {
31
        return 0;
32
    }
33

34
    if (strcmp(dpath, "/system/etc/init/atrace.rc")) {
35
        return 0;
36
    }
37

38
    // we only process the first read
39
    static bool rc_inserted = false;
40
    if (rc_inserted) {
41
        // we don't need this kprobe, unregister it!
42
        stop_vfs_read_hook();
43
        return 0;
44
    }
45
    rc_inserted = true;
46

47
    // now we can sure that the init process is reading
48
    // `/system/etc/init/atrace.rc`
49
    buf = *buf_ptr;
50
    count = *count_ptr;
51

52
    size_t rc_count = strlen(KERNEL_SU_RC);
53

54
    pr_info("vfs_read: %s, comm: %s, count: %zu, rc_count: %zu\n", dpath,
55
            current->comm, count, rc_count);
56

57
    if (count < rc_count) {
58
        pr_err("count: %zu < rc_count: %zu\n", count, rc_count);
59
        return 0;
60
    }
61

62
    size_t ret = copy_to_user(buf, KERNEL_SU_RC, rc_count);
63
    if (ret) {
64
        pr_err("copy ksud.rc failed: %zu\n", ret);
65
        return 0;
66
    }
67

68
    // we've succeed to insert ksud.rc, now we need to proxy the read and modify the result!
69
    // But, we can not modify the file_operations directly, because it's in read-only memory.
70
    // We just replace the whole file_operations with a proxy one.
71
    memcpy(&fops_proxy, file->f_op, sizeof(struct file_operations));
72
    orig_read = file->f_op->read;
73
    if (orig_read) {
74
        fops_proxy.read = read_proxy;
75
    }
76
    orig_read_iter = file->f_op->read_iter;
77
    if (orig_read_iter) {
78
        fops_proxy.read_iter = read_iter_proxy;
79
    }
80
    // replace the file_operations
81
    file->f_op = &fops_proxy;
82
    read_count_append = rc_count;
83

84
    *buf_ptr = buf + rc_count;
85
    *count_ptr = count - rc_count;
86

87
    return 0;
88
}

ksu hook了sys_read 这个系统调用，用来监控 init 过程中的文件读取

在 init 读取 atrace.rc 时，将 KERNEL_SU_RC 插入原本的rc中

由于 file_operations 结构体位于只读内存中，我们无法直接修改其中的成员，所以必须替换 file 结构体中的 f_op 指针，使其指向我们自定义的 file_operations 结构体

1
struct file {
2
  union {
3
    struct llist_node  f_llist;
4
    struct rcu_head   f_rcuhead;
5
    unsigned int     f_iocb_flags;
6
  };
7
  struct path    f_path;
8
  struct inode    *f_inode;  /* cached value */
9
  const struct file_operations  *f_op;      /*替换他*/
10

11
  /*
12
   * Protects f_ep, f_flags.
13
   * Must not be taken from IRQ context.
14
   */
15
  spinlock_t    f_lock;
16
  atomic_long_t    f_count;
17
  unsigned int     f_flags;
18
  fmode_t      f_mode;
19
  struct mutex    f_pos_lock;
20
  loff_t      f_pos;
21
  struct fown_struct  f_owner;
22
  const struct cred  *f_cred;
23
  struct file_ra_state  f_ra;
24

25
  u64      f_version;
26
#ifdef CONFIG_SECURITY
27
  void      *f_security;
28
#endif
29
  /* needed for tty driver, and maybe others */
30
  void      *private_data;
31

32
#ifdef CONFIG_EPOLL
33
  /* Used by fs/eventpoll.c to link all the hooks to this file */
34
  struct hlist_head  *f_ep;
35
#endif /* #ifdef CONFIG_EPOLL */
36
  struct address_space  *f_mapping;
37
  errseq_t    f_wb_err;
38
  errseq_t    f_sb_err; /* for syncfs */
39

40
  ANDROID_KABI_RESERVE(1);
41
  ANDROID_KABI_RESERVE(2);
42
}

1
static ssize_t read_proxy(struct file *file, char __user *buf, size_t count,
2
                          loff_t *pos)
3
{
4
    bool first_read = file->f_pos == 0;
5
    ssize_t ret = orig_read(file, buf, count, pos);
6
    if (first_read) {
7
        pr_info("read_proxy append %ld + %ld\n", ret, read_count_append);
8
        ret += read_count_append;
9
    }
10
    return ret;
11
}
12

13
static ssize_t read_iter_proxy(struct kiocb *iocb, struct iov_iter *to)
14
{
15
    bool first_read = iocb->ki_pos == 0;
16
    ssize_t ret = orig_read_iter(iocb, to);
17
    if (first_read) {
18
        pr_info("read_iter_proxy append %ld + %ld\n", ret, read_count_append);
19
        ret += read_count_append;
20
    }
21
    return ret;
22
}

代理了read和read_iter使其返回正确的长度

1
static const char KERNEL_SU_RC[] =
2
    "\n"
3

4
    "on post-fs-data\n"
5
    "    start logd\n"
6
    // We should wait for the post-fs-data finish
7
    "    exec u:r:su:s0 root -- " KSUD_PATH " post-fs-data\n"
8
    "\n"
9

10
    "on nonencrypted\n"
11
    "    exec u:r:su:s0 root -- " KSUD_PATH " services\n"
12
    "\n"
13

14
    "on property:vold.decrypt=trigger_restart_framework\n"
15
    "    exec u:r:su:s0 root -- " KSUD_PATH " services\n"
16
    "\n"
17

18
    "on property:sys.boot_completed=1\n"
19
    "    exec u:r:su:s0 root -- " KSUD_PATH " boot-completed\n"
20
    "\n"
21

22
    "\n";

这样， init在执行atrace.rc时，就会执行 KERNEL_SU_RC 的内容，在特定阶段启动ksud

安全模式#

1
static struct kprobe input_event_kp = {
2
    .symbol_name = "input_event",
3
    .pre_handler = input_handle_event_handler_pre,
4
};

直接hook了input_event这个函数

1
static unsigned int volumedown_pressed_count = 0;
2

3
static bool is_volumedown_enough(unsigned int count)
4
{
5
    return count >= 3;
6
}
7

8
int ksu_handle_input_handle_event(unsigned int *type, unsigned int *code,
9
                                  int *value)
10
{
11
    if (*type == EV_KEY && *code == KEY_VOLUMEDOWN) {
12
        int val = *value;
13
        pr_info("KEY_VOLUMEDOWN val: %d\n", val);
14
        if (val) {
15
            // key pressed, count it
16
            volumedown_pressed_count += 1;
17
            if (is_volumedown_enough(volumedown_pressed_count)) {
18
                stop_input_hook();
19
            }
20
        }
21
    }
22

23
    return 0;
24
}
25

26
bool ksu_is_safe_mode()
27
{
28
    static bool safe_mode = false;
29
    if (safe_mode) {
30
        // don't need to check again, userspace may call multiple times
31
        return true;
32
    }
33

34
    // stop hook first!
35
    stop_input_hook();
36

37
    pr_info("volumedown_pressed_count: %d\n", volumedown_pressed_count);
38
    if (is_volumedown_enough(volumedown_pressed_count)) {
39
        // pressed over 3 times
40
        pr_info("KEY_VOLUMEDOWN pressed max times, safe mode detected!\n");
41
        safe_mode = true;
42
        return true;
43
    }
44

45
    return false;
46
}

监控音量下键按下次数，次数达到三次就会进入安全模式，然后交由ksud执行安全模式的操作

pkg_observer#

1
#define MASK_SYSTEM (FS_CREATE | FS_MOVE | FS_EVENT_ON_CHILD)
2

3
static struct watch_dir g_watch = { .path = "/data/system",
4
                    .mask = MASK_SYSTEM };
5

6
static int ksu_handle_inode_event(struct fsnotify_mark *mark, u32 mask,
7
                  struct inode *inode, struct inode *dir,
8
                  const struct qstr *file_name, u32 cookie)
9
{
10
    if (!file_name)
11
        return 0;
12
    if (mask & FS_ISDIR)
13
        return 0;
14
    if (file_name->len == 13 &&
15
        !memcmp(file_name->name, "packages.list", 13)) {
16
        pr_info("packages.list detected: %d\n", mask);
17
        track_throne(false);
18
    }
19
    return 0;
20
}
21

22
static const struct fsnotify_ops ksu_ops = {
23
    .handle_inode_event = ksu_handle_inode_event,
24
};
25

26

27
int ksu_observer_init(void)
28
{
29
    int ret = 0;
30

31
#if LINUX_VERSION_CODE >= KERNEL_VERSION(6, 0, 0)
32
    g = fsnotify_alloc_group(&ksu_ops, 0);
33
#else
34
    g = fsnotify_alloc_group(&ksu_ops);
35
#endif
36
    if (IS_ERR(g))
37
        return PTR_ERR(g);
38

39
    ret = watch_one_dir(&g_watch);
40
    pr_info("observer init done\n");
41
    return 0;
42
}

使用fsnotify监控了/data/system这个目录下文件/目录的创建和移动事件（其中目录事件会被处理函数直接忽略）

如果检测到packages.list 的变化，就会执行track_throne(false)

详见throne_tracker模块

seccomp_cache#

1
#ifndef __KSU_H_KERNEL_COMPAT
2
#define __KSU_H_KERNEL_COMPAT
3

4
#include <linux/fs.h>
5
#include <linux/version.h>
6

7
extern void ksu_seccomp_clear_cache(struct seccomp_filter *filter, int nr);
8
extern void ksu_seccomp_allow_cache(struct seccomp_filter *filter, int nr);
9

10
#endif

用于清除/恢复seccomp的cache功能

setuid_hook#

1
static bool ksu_enhanced_security_enabled = false;
2

3
static int enhanced_security_feature_get(u64 *value)
4
{
5
    *value = ksu_enhanced_security_enabled ? 1 : 0;
6
    return 0;
7
}
8

9
static int enhanced_security_feature_set(u64 value)
10
{
11
    bool enable = value != 0;
12
    ksu_enhanced_security_enabled = enable;
13
    pr_info("enhanced_security: set to %d\n", enable);
14
    return 0;
15
}
16

17
static const struct ksu_feature_handler enhanced_security_handler = {
18
    .feature_id = KSU_FEATURE_ENHANCED_SECURITY,
19
    .name = "enhanced_security",
20
    .get_handler = enhanced_security_feature_get,
21
    .set_handler = enhanced_security_feature_set,
22
};

主要是实现了增强安全性(enhanced_security)这个功能和未开启增强安全性时常规的提权

直接看功能实现函数

1
int ksu_handle_setresuid(uid_t ruid, uid_t euid, uid_t suid)
2
{
3
    // we rely on the fact that zygote always call setresuid(3) with same uids
4
    uid_t new_uid = ruid;
5
    uid_t old_uid = current_uid().val;
6

7
    pr_info("handle_setresuid from %d to %d\n", old_uid, new_uid);
8

9
    // if old process is root, ignore it.
10
    if (old_uid != 0 && ksu_enhanced_security_enabled) {
11
        // disallow any non-ksu domain escalation from non-root to root!
12
        // euid is what we care about here as it controls permission
13
        if (unlikely(euid == 0)) {
14
            if (!is_ksu_domain()) {
15
                pr_warn("find suspicious EoP: %d %s, from %d to %d\n",
16
                    current->pid, current->comm, old_uid, new_uid);
17
                force_sig(SIGKILL);
18
                return 0;
19
            }
20
        }
21
        // disallow appuid decrease to any other uid if it is not allowed to su
22
        if (is_appuid(old_uid)) {
23
            if (euid < current_euid().val && !ksu_is_allow_uid_for_current(old_uid)) {
24
                pr_warn("find suspicious EoP: %d %s, from %d to %d\n",
25
                    current->pid, current->comm, old_uid, new_uid);
26
                force_sig(SIGKILL);
27
                return 0;
28
            }
29
        }
30
        return 0;
31
    }
32

33
    // if on private space, see if its possibly the manager
34
    if (new_uid > PER_USER_RANGE && new_uid % PER_USER_RANGE == ksu_get_manager_uid()) {
35
        ksu_set_manager_uid(new_uid);
36
    }
37

38
    if (ksu_get_manager_uid() == new_uid) {
39
        pr_info("install fd for manager: %d\n", new_uid);
40
        ksu_install_fd();
41
        spin_lock_irq(&current->sighand->siglock);
42
        ksu_seccomp_allow_cache(current->seccomp.filter, __NR_reboot);
43
        ksu_set_task_tracepoint_flag(current);
44
        spin_unlock_irq(&current->sighand->siglock);
45
        return 0;
46
    }
47

48
    if (ksu_is_allow_uid_for_current(new_uid)) {
49
        if (current->seccomp.mode == SECCOMP_MODE_FILTER &&
50
            current->seccomp.filter) {
51
            spin_lock_irq(&current->sighand->siglock);
52
            ksu_seccomp_allow_cache(current->seccomp.filter, __NR_reboot);
53
            spin_unlock_irq(&current->sighand->siglock);
54
        }
55
        ksu_set_task_tracepoint_flag(current);
56
    } else {
57
        ksu_clear_task_tracepoint_flag_if_needed(current);
58
    }
59

60
    // Handle kernel umount
61
    ksu_handle_umount(old_uid, new_uid);
62

63
    return 0;
64
}

开启增强安全性后，将会阻止ksu_domain 外的所有进程通过setresuid从非root提升到root

同时阻止未被授予su权限的app通过setresuid把euid降到比当前euid更小的值（已在allowlist中的app不受此限制）

sucompat#

实现了su兼容性这个功能

模块内处理了三种系统调用

1
#define SU_PATH "/system/bin/su"
2
int ksu_handle_faccessat(int *dfd, const char __user **filename_user, int *mode,
3
                         int *__unused_flags)
4
{
5
    const char su[] = SU_PATH;
6

7
    if (!ksu_is_allow_uid_for_current(current_uid().val)) {
8
        return 0;
9
    }
10

11
    char path[sizeof(su) + 1];
12
    memset(path, 0, sizeof(path));
13
    strncpy_from_user_nofault(path, *filename_user, sizeof(path));
14

15
    if (unlikely(!memcmp(path, su, sizeof(su)))) {
16
        pr_info("faccessat su->sh!\n");
17
        *filename_user = sh_user_path();
18
    }
19

20
    return 0;
21
}
22

23
int ksu_handle_stat(int *dfd, const char __user **filename_user, int *flags)
24
{
25
    // const char sh[] = SH_PATH;
26
    const char su[] = SU_PATH;
27

28
    if (!ksu_is_allow_uid_for_current(current_uid().val)) {
29
        return 0;
30
    }
31

32
    if (unlikely(!filename_user)) {
33
        return 0;
34
    }
35

36
    char path[sizeof(su) + 1];
37
    memset(path, 0, sizeof(path));
38
    strncpy_from_user_nofault(path, *filename_user, sizeof(path));
39

40
    if (unlikely(!memcmp(path, su, sizeof(su)))) {
41
        pr_info("newfstatat su->sh!\n");
42
        *filename_user = sh_user_path();
43
    }
44

45
    return 0;
46
}

在获取/system/bin/su的属性时，实际上被替换为/system/bin/sh 的属性

1
int ksu_handle_execve_sucompat(const char __user **filename_user,
2
                               void *__never_use_argv, void *__never_use_envp,
3
                               int *__never_use_flags)
4
{
5
    const char su[] = SU_PATH;
6
    const char __user *fn;
7
    char path[sizeof(su) + 1];
8
    long ret;
9
    unsigned long addr;
10

11
    if (unlikely(!filename_user))
12
        return 0;
13

14
    if (!ksu_is_allow_uid_for_current(current_uid().val))
15
        return 0;
16

17
    addr = untagged_addr((unsigned long)*filename_user);
18
    fn = (const char __user *)addr;
19
    memset(path, 0, sizeof(path));
20
    ret = strncpy_from_user_nofault(path, fn, sizeof(path));
21

22
    if (ret < 0 && try_set_access_flag(addr)) {
23
        ret = strncpy_from_user_nofault(path, fn, sizeof(path));
24
    }
25

26
    if (ret < 0 && preempt_count()) {
27
        /* This is crazy, but we know what we are doing:
28
         * Temporarily exit atomic context to handle page faults, then restore it */
29
        pr_info("Access filename failed, try rescue..\n");
30
        preempt_enable_no_resched_notrace();
31
        ret = strncpy_from_user(path, fn, sizeof(path));
32
        preempt_disable_notrace();
33
    }
34

35
    if (ret < 0) {
36
        pr_warn("Access filename when execve failed: %ld", ret);
37
        return 0;
38
    }
39

40
    if (likely(memcmp(path, su, sizeof(su))))
41
        return 0;
42

43
    pr_info("sys_execve su found\n");
44
    *filename_user = ksud_user_path();
45

46
    escape_with_root_profile();
47

48
    return 0;
49
}

当进程尝试执行/system/bin/su 时，filename被替换为ksud的路径，并且执行提权操作

ksu_su_compat_enabled实际上影响了syscall_hook_manager模块中的ksu_sys_enter_handler函数

1
static void ksu_sys_enter_handler(void *data, struct pt_regs *regs, long id)
2
{
3
  if (unlikely(check_syscall_fastpath(id))) {
4
    if (ksu_su_compat_enabled) {
5
      // Handle newfstatat
6
      if (id == __NR_newfstatat) {
7
        int *dfd = (int *)&PT_REGS_PARM1(regs);
8
        const char __user **filename_user =
9
          (const char __user **)&PT_REGS_PARM2(regs);
10
        int *flags = (int *)&PT_REGS_SYSCALL_PARM4(regs);
11
        ksu_handle_stat(dfd, filename_user, flags);
12
        return;
13
      }
14

15
      // Handle faccessat
16
      if (id == __NR_faccessat) {
17
        int *dfd = (int *)&PT_REGS_PARM1(regs);
18
        const char __user **filename_user =
19
          (const char __user **)&PT_REGS_PARM2(regs);
20
        int *mode = (int *)&PT_REGS_PARM3(regs);
21
        ksu_handle_faccessat(dfd, filename_user, mode, NULL);
22
        return;
23
      }
24

25
      // Handle execve
26
      if (id == __NR_execve) {
27
        const char __user **filename_user =
28
          (const char __user **)&PT_REGS_PARM1(regs);
29
        if (current->pid != 1 && is_init(get_current_cred())) {
30
          ksu_handle_init_mark_tracker(filename_user);
31
        } else {
32
                    ksu_handle_execve_sucompat(filename_user, NULL, NULL, NULL);
33
                }
34
        return;
35
      }
36
    }
37

38
        // Handle setresuid
39
    if (id == __NR_setresuid) {
40
      uid_t ruid = (uid_t)PT_REGS_PARM1(regs);
41
      uid_t euid = (uid_t)PT_REGS_PARM2(regs);
42
      uid_t suid = (uid_t)PT_REGS_PARM3(regs);
43
      ksu_handle_setresuid(ruid, euid, suid);
44
      return;
45
    }
46
  }
47
}

关闭su兼容性后，ksu_sys_enter_handler不再处理newfstatat、faccessat和execve，任何进程都无法再通过su命令来获取root权限（已经提权过的进程不受影响）

supercall#

1
bool ksu_su_compat_enabled __read_mostly = true;
2

3
static int su_compat_feature_get(u64 *value)
4
{
5
    *value = ksu_su_compat_enabled ? 1 : 0;
6
    return 0;
7
}
8

9
static int su_compat_feature_set(u64 value)
10
{
11
    bool enable = value != 0;
12
    ksu_su_compat_enabled = enable;
13
    pr_info("su_compat: set to %d\n", enable);
14
    return 0;
15
}
16

17
static const struct ksu_feature_handler su_compat_handler = {
18
    .feature_id = KSU_FEATURE_SU_COMPAT,
19
    .name = "su_compat",
20
    .get_handler = su_compat_feature_get,
21
    .set_handler = su_compat_feature_set,
22
};

这个模块巧妙地通过 hook sys_reboot 函数分发ioctl的匿名fd实现了用户态与内核态的通信

1
// IOCTL handlers mapping table
2
static const struct ksu_ioctl_cmd_map ksu_ioctl_handlers[] = {
3
    { .cmd = KSU_IOCTL_GRANT_ROOT, .name = "GRANT_ROOT", .handler = do_grant_root, .perm_check = allowed_for_su },
4
    { .cmd = KSU_IOCTL_GET_INFO, .name = "GET_INFO", .handler = do_get_info, .perm_check = always_allow },
5
    { .cmd = KSU_IOCTL_REPORT_EVENT, .name = "REPORT_EVENT", .handler = do_report_event, .perm_check = only_root },
6
    { .cmd = KSU_IOCTL_SET_SEPOLICY, .name = "SET_SEPOLICY", .handler = do_set_sepolicy, .perm_check = only_root },
7
    { .cmd = KSU_IOCTL_CHECK_SAFEMODE, .name = "CHECK_SAFEMODE", .handler = do_check_safemode, .perm_check = always_allow },
8
    { .cmd = KSU_IOCTL_GET_ALLOW_LIST, .name = "GET_ALLOW_LIST", .handler = do_get_allow_list, .perm_check = manager_or_root },
9
    { .cmd = KSU_IOCTL_GET_DENY_LIST, .name = "GET_DENY_LIST", .handler = do_get_deny_list, .perm_check = manager_or_root },
10
    { .cmd = KSU_IOCTL_UID_GRANTED_ROOT, .name = "UID_GRANTED_ROOT", .handler = do_uid_granted_root, .perm_check = manager_or_root },
11
    { .cmd = KSU_IOCTL_UID_SHOULD_UMOUNT, .name = "UID_SHOULD_UMOUNT", .handler = do_uid_should_umount, .perm_check = manager_or_root },
12
    { .cmd = KSU_IOCTL_GET_MANAGER_UID, .name = "GET_MANAGER_UID", .handler = do_get_manager_uid, .perm_check = manager_or_root },
13
    { .cmd = KSU_IOCTL_GET_APP_PROFILE, .name = "GET_APP_PROFILE", .handler = do_get_app_profile, .perm_check = only_manager },
14
    { .cmd = KSU_IOCTL_SET_APP_PROFILE, .name = "SET_APP_PROFILE", .handler = do_set_app_profile, .perm_check = only_manager },
15
    { .cmd = KSU_IOCTL_GET_FEATURE, .name = "GET_FEATURE", .handler = do_get_feature, .perm_check = manager_or_root },
16
    { .cmd = KSU_IOCTL_SET_FEATURE, .name = "SET_FEATURE", .handler = do_set_feature, .perm_check = manager_or_root },
17
    { .cmd = KSU_IOCTL_GET_WRAPPER_FD, .name = "GET_WRAPPER_FD", .handler = do_get_wrapper_fd, .perm_check = manager_or_root },
18
    { .cmd = KSU_IOCTL_MANAGE_MARK, .name = "MANAGE_MARK", .handler = do_manage_mark, .perm_check = manager_or_root },
19
    { .cmd = KSU_IOCTL_NUKE_EXT4_SYSFS, .name = "NUKE_EXT4_SYSFS", .handler = do_nuke_ext4_sysfs, .perm_check = manager_or_root },
20
    { .cmd = KSU_IOCTL_ADD_TRY_UMOUNT, .name = "ADD_TRY_UMOUNT", .handler = add_try_umount, .perm_check = manager_or_root },
21
    { .cmd = 0, .name = NULL, .handler = NULL, .perm_check = NULL } // Sentinel
22
};

同时实现了相当多的命令，以及命令执行的权限校验机制

大部分命令都是直接调用其他模块的函数，不再分析

fd的分发#

1
// Install KSU fd to current process
2
int ksu_install_fd(void)
3
{
4
    struct file *filp;
5
    int fd;
6

7
    // Get unused fd
8
    fd = get_unused_fd_flags(O_CLOEXEC);
9
    if (fd < 0) {
10
        pr_err("ksu_install_fd: failed to get unused fd\n");
11
        return fd;
12
    }
13

14
    // Create anonymous inode file
15
    filp = anon_inode_getfile("[ksu_driver]", &anon_ksu_fops, NULL, O_RDWR | O_CLOEXEC);
16
    if (IS_ERR(filp)) {
17
        pr_err("ksu_install_fd: failed to create anon inode file\n");
18
        put_unused_fd(fd);
19
        return PTR_ERR(filp);
20
    }
21

22
    // Install fd
23
    fd_install(fd, filp);
24

25
    pr_info("ksu fd installed: %d for pid %d\n", fd, current->pid);
26

27
    return fd;
28
}
29

30
static void ksu_install_fd_tw_func(struct callback_head *cb)
31
{
32
    struct ksu_install_fd_tw *tw = container_of(cb, struct ksu_install_fd_tw, cb);
33
    int fd = ksu_install_fd();
34
    pr_info("[%d] install ksu fd: %d\n", current->pid, fd);
35

36
    if (copy_to_user(tw->outp, &fd, sizeof(fd))) {
37
        pr_err("install ksu fd reply err\n");
38
#if LINUX_VERSION_CODE >= KERNEL_VERSION(5, 11, 0)
39
        close_fd(fd);
40
#else
41
        ksys_close(fd);
42
#endif
43
    }
44

45
    kfree(tw);
46
}
47

48

49
static int reboot_handler_pre(struct kprobe *p, struct pt_regs *regs)
50
{
51
    struct pt_regs *real_regs = PT_REAL_REGS(regs);
52
    int magic1 = (int)PT_REGS_PARM1(real_regs);
53
    int magic2 = (int)PT_REGS_PARM2(real_regs);
54
    unsigned long arg4;
55

56
    // Check if this is a request to install KSU fd
57
    if (magic1 == KSU_INSTALL_MAGIC1 && magic2 == KSU_INSTALL_MAGIC2) {
58
        struct ksu_install_fd_tw *tw;
59

60
        arg4 = (unsigned long)PT_REGS_SYSCALL_PARM4(real_regs);
61

62
        tw = kzalloc(sizeof(*tw), GFP_ATOMIC);
63
        if (!tw)
64
            return 0;
65

66
        tw->outp = (int __user *)arg4;
67
        tw->cb.func = ksu_install_fd_tw_func;
68

69
        if (task_work_add(current, &tw->cb, TWA_RESUME)) {
70
            kfree(tw);
71
            pr_warn("install fd add task_work failed\n");
72
        }
73
    }
74

75
    return 0;
76
}
77

78
static struct kprobe reboot_kp = {
79
    .symbol_name = REBOOT_SYMBOL,
80
    .pre_handler = reboot_handler_pre,
81
};

hook 了sys_reboot，首先检查传入的前两个参数是否为特定的Magic Num

如果检查通过，ksu将会创建一个匿名inode文件和对应的fd，并且将这个fd与自定义的file_operations关联

最后将fd写入第四个参数所指向的用户态地址中，供用户态程序使用

内核ioctl分发器#

1
// IOCTL dispatcher
2
static long anon_ksu_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
3
{
4
    void __user *argp = (void __user *)arg;
5
    int i;
6

7
#ifdef CONFIG_KSU_DEBUG
8
    pr_info("ksu ioctl: cmd=0x%x from uid=%d\n", cmd, current_uid().val);
9
#endif
10

11
    for (i = 0; ksu_ioctl_handlers[i].handler; i++) {
12
        if (cmd == ksu_ioctl_handlers[i].cmd) {
13
            // Check permission first
14
            if (ksu_ioctl_handlers[i].perm_check &&
15
                !ksu_ioctl_handlers[i].perm_check()) {
16
                pr_warn("ksu ioctl: permission denied for cmd=0x%x uid=%d\n",
17
                    cmd, current_uid().val);
18
                return -EPERM;
19
            }
20
            // Execute handler
21
            return ksu_ioctl_handlers[i].handler(argp);
22
        }
23
    }
24

25
    pr_warn("ksu ioctl: unsupported command 0x%x\n", cmd);
26
    return -ENOTTY;
27
}

根据传入的cmd查找指定命令，先进行权限校验，校验通过后再执行该命令的handler

syscall_hook_manager#

这个模块是系统调用的主拦截点，并且通过非常巧妙的方式修复了之前出现的侧信道检测问题

KernelSU检测之“时间侧信道攻击”

1
void ksu_syscall_hook_manager_init(void)
2
{
3
  int ret;
4
  pr_info("hook_manager: ksu_hook_manager_init called\n");
5

6
#ifdef CONFIG_KRETPROBES
7
  // Register kretprobe for syscall_regfunc
8
  syscall_regfunc_rp = init_kretprobe("syscall_regfunc", syscall_regfunc_handler);
9
  // Register kretprobe for syscall_unregfunc
10
  syscall_unregfunc_rp = init_kretprobe("syscall_unregfunc", syscall_unregfunc_handler);
11
#endif
12

13
#ifdef CONFIG_HAVE_SYSCALL_TRACEPOINTS
14
  ret = register_trace_sys_enter(ksu_sys_enter_handler, NULL);
15
#ifndef CONFIG_KRETPROBES
16
  ksu_mark_running_process_locked();
17
#endif
18
  if (ret) {
19
    pr_err("hook_manager: failed to register sys_enter tracepoint: %d\n", ret);
20
  } else {
21
    pr_info("hook_manager: sys_enter tracepoint registered\n");
22
  }
23
#endif
24

25
  ksu_setuid_hook_init();
26
  ksu_sucompat_init();
27
}

syscall_hook_manager 抛弃了之前直接使用kprobe hook系统调用的方式(性能较差)

转而通过TracePoints直接hook sys_enter ，根据参数来判断执行的系统调用

1
static int syscall_regfunc_handler(struct kretprobe_instance *ri, struct pt_regs *regs)
2
{
3
  unsigned long flags;
4
  spin_lock_irqsave(&tracepoint_reg_lock, flags);
5
  if (tracepoint_reg_count < 1) {
6
    // while install our tracepoint, mark our processes
7
    ksu_mark_running_process_locked();
8
  } else if (tracepoint_reg_count == 1) {
9
    // while other tracepoint first added, mark all processes
10
    ksu_mark_all_process();
11
  }
12
  tracepoint_reg_count++;
13
  spin_unlock_irqrestore(&tracepoint_reg_lock, flags);
14
  return 0;
15
}
16

17
static int syscall_unregfunc_handler(struct kretprobe_instance *ri, struct pt_regs *regs)
18
{
19
  unsigned long flags;
20
  spin_lock_irqsave(&tracepoint_reg_lock, flags);
21
  tracepoint_reg_count--;
22
  if (tracepoint_reg_count <= 0) {
23
    // while no tracepoint left, unmark all processes
24
    ksu_unmark_all_process();
25
  } else if (tracepoint_reg_count == 1) {
26
    // while just our tracepoint left, unmark disallowed processes
27
    ksu_mark_running_process_locked();
28
  }
29
  spin_unlock_irqrestore(&tracepoint_reg_lock, flags);
30
  return 0;
31
}

同时，ksu使用了kretprobe hook注册 tracepoints 要经过的syscall_regfunc 和 syscall_unregfunc 函数

维护了 tracepoint_reg_count 用来判断当前是否只有ksu注册了tracepoint

为什么要这么做？

实际上，tracepoints的生效依赖于进程的thread_info 中的 SYSCALL_TRACEPOINT 标志位

为了对抗侧信道检测，ksu会将所有非必要进程的 SYSCALL_TRACEPOINT 标志位置为0

这样，对于我们未授予权限的进程，根本不会触发这个tracepoint,自然也就无法通过执行时间侧信道检测ksu的存在

但是这里有一个问题，如果除了ksu还有别的tracepoint怎么办？

这时ksu会直接将所有进程的SYSCALL_TRACEPOINT 标志位置为1,以保证其他工具的正常使用

1
// Tracepoint registration count management
2
// == 1: just us
3
// >  1: someone else is also using syscall tracepoint e.g. ftrace
4
static int tracepoint_reg_count = 0;
5
static DEFINE_SPINLOCK(tracepoint_reg_lock);
6

7
void ksu_clear_task_tracepoint_flag_if_needed(struct task_struct *t)
8
{
9
  unsigned long flags;
10
  spin_lock_irqsave(&tracepoint_reg_lock, flags);
11
  if (tracepoint_reg_count <= 1) {
12
    ksu_clear_task_tracepoint_flag(t);
13
  }
14
  spin_unlock_irqrestore(&tracepoint_reg_lock, flags);
15
}
16

17
// Process marking management
18
static void handle_process_mark(bool mark)
19
{
20
  struct task_struct *p, *t;
21
  read_lock(&tasklist_lock);
22
  for_each_process_thread(p, t) {
23
    if (mark)
24
      ksu_set_task_tracepoint_flag(t);
25
    else
26
      ksu_clear_task_tracepoint_flag(t);
27
  }
28
  read_unlock(&tasklist_lock);
29
}
30

31
void ksu_mark_all_process(void)
32
{
33
  handle_process_mark(true);
34
  pr_info("hook_manager: mark all user process done!\n");
35
}
36

37
void ksu_unmark_all_process(void)
38
{
39
  handle_process_mark(false);
40
  pr_info("hook_manager: unmark all user process done!\n");
41
}
42

43
static void ksu_mark_running_process_locked()
44
{
45
  struct task_struct *p, *t;
46
  read_lock(&tasklist_lock);
47
  for_each_process_thread (p, t) {
48
    if (!t->mm) { // only user processes
49
      continue;
50
    }
51
    int uid = task_uid(t).val;
52
        const struct cred *cred = get_task_cred(t);
53
    bool ksu_root_process =
54
      uid == 0 && is_task_ksu_domain(cred);
55
        bool is_zygote_process = is_zygote(cred);
56
        bool is_shell = uid == 2000;
57
        // before boot completed, we shall mark init for marking zygote
58
        bool is_init = t->pid == 1;
59
    if (ksu_root_process || is_zygote_process  || is_shell || is_init
60
            || ksu_is_allow_uid(uid)) {
61
      ksu_set_task_tracepoint_flag(t);
62
      pr_info("hook_manager: mark process: pid:%d, uid: %d, comm:%s\n",
63
          t->pid, uid, t->comm);
64
    } else {
65
      ksu_clear_task_tracepoint_flag(t);
66
      pr_info("hook_manager: unmark process: pid:%d, uid: %d, comm:%s\n",
67
          t->pid, uid, t->comm);
68
    }
69
        put_cred(cred);
70
  }
71
  read_unlock(&tasklist_lock);
72
}
73

74
void ksu_mark_running_process()
75
{
76
  unsigned long flags;
77
  spin_lock_irqsave(&tracepoint_reg_lock, flags);
78
  if (tracepoint_reg_count <= 1) {
79
    ksu_mark_running_process_locked();
80
  } else {
81
    pr_info("hook_manager: not mark running process since syscall tracepoint is in use\n");
82
  }
83
  spin_unlock_irqrestore(&tracepoint_reg_lock, flags);
84
}
85

86
// Get task mark status
87
// Returns: 1 if marked, 0 if not marked, -ESRCH if task not found
88
int ksu_get_task_mark(pid_t pid)
89
{
90
  struct task_struct *task;
91
  int marked = -ESRCH;
92

93
  rcu_read_lock();
94
  task = find_task_by_vpid(pid);
95
  if (task) {
96
    get_task_struct(task);
97
    rcu_read_unlock();
98
#if LINUX_VERSION_CODE >= KERNEL_VERSION(5, 11, 0)
99
    marked = test_task_syscall_work(task, SYSCALL_TRACEPOINT) ? 1 : 0;
100
#else
101
    marked = test_tsk_thread_flag(task, TIF_SYSCALL_TRACEPOINT) ? 1 : 0;
102
#endif
103
    put_task_struct(task);
104
  } else {
105
    rcu_read_unlock();
106
  }
107

108
  return marked;
109
}
110

111
// Set task mark status
112
// Returns: 0 on success, -ESRCH if task not found
113
int ksu_set_task_mark(pid_t pid, bool mark)
114
{
115
  struct task_struct *task;
116
  int ret = -ESRCH;
117

118
  rcu_read_lock();
119
  task = find_task_by_vpid(pid);
120
  if (task) {
121
    get_task_struct(task);
122
    rcu_read_unlock();
123
    if (mark) {
124
      ksu_set_task_tracepoint_flag(task);
125
      pr_info("hook_manager: marked task pid=%d comm=%s\n", pid, task->comm);
126
    } else {
127
      ksu_clear_task_tracepoint_flag(task);
128
      pr_info("hook_manager: unmarked task pid=%d comm=%s\n", pid, task->comm);
129
    }
130
    put_task_struct(task);
131
    ret = 0;
132
  } else {
133
    rcu_read_unlock();
134
  }
135

136
  return ret;
137
}

throne_tracker#

实现了两个功能，定位管理器和清理allow_list无用项

1
void track_throne(bool prune_only)
2
{
3
    struct file *fp = filp_open(SYSTEM_PACKAGES_LIST_PATH, O_RDONLY, 0);
4
    if (IS_ERR(fp)) {
5
        pr_err("%s: open " SYSTEM_PACKAGES_LIST_PATH " failed: %ld\n", __func__,
6
               PTR_ERR(fp));
7
        return;
8
    }
9

10
    struct list_head uid_list;
11
    INIT_LIST_HEAD(&uid_list);
12

13
    char chr = 0;
14
    loff_t pos = 0;
15
    loff_t line_start = 0;
16
    char buf[KSU_MAX_PACKAGE_NAME];
17
    for (;;) {
18
        ssize_t count = kernel_read(fp, &chr, sizeof(chr), &pos);
19
        if (count != sizeof(chr))
20
            break;
21
        if (chr != '\n')
22
            continue;
23

24
        count = kernel_read(fp, buf, sizeof(buf), &line_start);
25

26
        struct uid_data *data = kzalloc(sizeof(struct uid_data), GFP_ATOMIC);
27
        if (!data) {
28
            filp_close(fp, 0);
29
            goto out;
30
        }
31

32
        char *tmp = buf;
33
        const char *delim = " ";
34
        char *package = strsep(&tmp, delim);
35
        char *uid = strsep(&tmp, delim);
36
        if (!uid || !package) {
37
            pr_err("update_uid: package or uid is NULL!\n");
38
            break;
39
        }
40

41
        u32 res;
42
        if (kstrtou32(uid, 10, &res)) {
43
            pr_err("update_uid: uid parse err\n");
44
            break;
45
        }
46
        data->uid = res;
47
        strncpy(data->package, package, KSU_MAX_PACKAGE_NAME);
48
        list_add_tail(&data->list, &uid_list);
49
        // reset line start
50
        line_start = pos;
51
    }
52
    filp_close(fp, 0);
53

54
    // now update uid list
55
    struct uid_data *np;
56
    struct uid_data *n;
57

58
    if (prune_only)
59
        goto prune;
60

61
    // first, check if manager_uid exist!
62
    bool manager_exist = false;
63
    list_for_each_entry (np, &uid_list, list) {
64
        // if manager is installed in work profile, the uid in packages.list is still equals main profile
65
        // don't delete it in this case!
66
        int manager_uid = ksu_get_manager_uid() % 100000;
67
        if (np->uid == manager_uid) {
68
            manager_exist = true;
69
            break;
70
        }
71
    }
72

73
    if (!manager_exist) {
74
        if (ksu_is_manager_uid_valid()) {
75
            pr_info("manager is uninstalled, invalidate it!\n");
76
            ksu_invalidate_manager_uid();
77
            goto prune;
78
        }
79
        pr_info("Searching manager...\n");
80
        search_manager("/data/app", 2, &uid_list);
81
        pr_info("Search manager finished\n");
82
    }
83

84
prune:
85
    // then prune the allowlist
86
    ksu_prune_allowlist(is_uid_exist, &uid_list);
87
out:
88
    // free uid_list
89
    list_for_each_entry_safe (np, n, &uid_list, list) {
90
        list_del(&np->list);
91
        kfree(np);
92
    }
93
}

首先，遍历了packages.list 获取所有app的包名和uid

随后使用两种寻找策略寻找manager_uid是否仍有效

如果已失效，则清除原有的manager_uid

随后执行ksu_prune_allowlist清理allow_list

‍

file_wrapper#

可以看到，ksu添加了ksu_file 这个文件类型，并且授予所有主体权限

对传入的fd进行包装，把他包装为ksu_file，然后返回

最后使用dup2完成同步

此时，root shell和终端应用均能访问这三个fd。

use proxy file for pts

主要是为了解决类似 Running pm from Termux fails 的问题

假设一个以 u:r:untrusted_app:s0 域运行的终端应用，如Termux

他执行了su命令，此时在内核会被替换成execve(“ksud”), ksud接着返回root shell

如果不做任何处理，作为应用的子进程，这个shell会沿用父进程的pts

而父进程的pts的SELinux上下文为u:object_r:untrusted_app_all_devpts:s0

root shell进程的域为su, 但是su这个主体并没有被授予 untrusted_app_all_devpts 的读写权限

1
[pixel@Britney setools]$ sesearch /home/pixel/Documents/evolutionX/out/target/product/oriole/vendor/etc/selinux/precompiled_sepolicy  -A -s su -t untrusted_app_all_devpts -c chr_file -p write
2
[pixel@Britney setools]$

所以此时的root shell是无法与我们的终端交互的，就会导致某些终端完全卡死，无法输入也无任何输出

为了解决这个问题，旧版的ksu直接hook了pts创建过程中调用的函数

1
int ksu_handle_devpts(struct inode *inode)
2
{
3
  if (!current->mm) {
4
    return 0;
5
  }
6

7
  uid_t uid = current_uid().val;
8
  if (uid % 100000 < 10000) {
9
    // not untrusted_app, ignore it
10
    return 0;
11
  }
12

13
  if (!ksu_is_allow_uid(uid))
14
    return 0;
15

16
  if (ksu_devpts_sid) {
17
#if LINUX_VERSION_CODE >= KERNEL_VERSION(5, 1, 0)
18
    struct inode_security_struct *sec = selinux_inode(inode);
19
#else
20
    struct inode_security_struct *sec =
21
      (struct inode_security_struct *)inode->i_security;
22
#endif
23
    if (sec) {
24
      sec->sid = ksu_devpts_sid;
25
    }
26
  }
27

28
  return 0;
29
}
30

31
#define DEVPTS_DOMAIN "u:object_r:devpts:s0"
32

33
u32 ksu_get_devpts_sid()
34
{
35
  u32 devpts_sid = 0;
36
  int err = security_secctx_to_secid(DEVPTS_DOMAIN, strlen(DEVPTS_DOMAIN),
37
             &devpts_sid);
38
  if (err) {
39
    pr_info("get devpts sid err %d\n", err);
40
  }
41
  return devpts_sid;
42
}

强制替换pts的sid为ksu_devpts_sid，这样所有 untrusted_app 创建的终端的SELinux上下文都会被改为u:object_r:devpts:s0

1
[pixel@Britney setools]$ sesearch /home/pixel/Documents/evolutionX/out/target/product/oriole/vendor/etc/selinux/precompiled_sepolicy  -A -s untrusted_app_all -t devpts -c chr_file -p write
2
allow appdomain devpts:chr_file { getattr ioctl read write };
3
[pixel@Britney setools]$ sesearch /home/pixel/Documents/evolutionX/out/target/product/oriole/vendor/etc/selinux/precompiled_sepolicy  -A -s su -t devpts -c chr_file -p write
4
allow appdomain devpts:chr_file { getattr ioctl read write };

su和untrusted_app 均有权访问

‍

在新版的ksu中，采取了另一种方法来突破这个限制（似乎有误，实际上测试下来发现仍然是直接修改的pts的sid？但是代码确实是这么写的啊）

在ksud的su.rs中

1
#[cfg(target_os = "android")]
2
fn wrap_tty(fd: c_int) {
3
    let inner_fn = move || -> Result<()> {
4
        if unsafe { libc::isatty(fd) != 1 } {
5
            return Ok(());
6
        }
7
        let new_fd = get_wrapped_fd(fd).context("get_wrapped_fd")?;
8
        if unsafe { libc::dup2(new_fd, fd) } == -1 {
9
            bail!("dup {new_fd} -> {fd} errno: {}", unsafe {
10
                *libc::__errno()
11
            });
12
        }
13
        unsafe { libc::close(new_fd) };
14
        Ok(())
15
    };
16

17
    if let Err(e) = inner_fn() {
18
        error!("wrap tty {fd}: {e:?}");
19
    }
20
}
21

22
#[cfg(not(any(target_os = "linux", target_os = "android")))]
23
pub fn root_shell() -> Result<()> {
24
    unimplemented!()
25
}
26

27
#[cfg(any(target_os = "linux", target_os = "android"))]
28
#[allow(clippy::similar_names)]
29
pub fn root_shell() -> Result<()> {
30
    // we are root now, this was set in kernel!
31

32
.................
33

34

35
    // escape from the current cgroup and become session leader
36
    // WARNING!!! This cause some root shell hang forever!
37
    // command = command.process_group(0);
38
    command = unsafe {
39
        command.pre_exec(move || {
40
            umask(0o22);
41
            utils::switch_cgroups();
42

43
            // switch to global mount namespace
44
            #[cfg(any(target_os = "linux", target_os = "android"))]
45
            if mount_master {
46
                let _ = utils::switch_mnt_ns(1);
47
            }
48

49
            #[cfg(target_os = "android")]
50
            if use_fd_wrapper {
51
                wrap_tty(0);
52
                wrap_tty(1);
53
                wrap_tty(2);
54
            }
55

56
            set_identity(uid, gid, &groups);
57

58
            Result::Ok(())
59
        })
60
    };
61

62
    command = command.args(args).arg0(arg0);
63
    Err(command.exec().into())
64
}

ksud会把原本的fd 0，1，2进行包装，也就是标准输入输出和错误

1
static int do_get_wrapper_fd(void __user *arg) {
2
    if (!ksu_file_sid) {
3
        return -EINVAL;
4
    }
5

6
    struct ksu_get_wrapper_fd_cmd cmd;
7
    int ret;
8

9
    if (copy_from_user(&cmd, arg, sizeof(cmd))) {
10
        pr_err("get_wrapper_fd: copy_from_user failed\n");
11
        return -EFAULT;
12
    }
13

14
    struct file* f = fget(cmd.fd);
15
    if (!f) {
16
        return -EBADF;
17
    }
18

19
    struct ksu_file_wrapper *data = ksu_create_file_wrapper(f);
20
    if (data == NULL) {
21
        ret = -ENOMEM;
22
        goto put_orig_file;
23
    }
24

25
#if LINUX_VERSION_CODE >= KERNEL_VERSION(6, 12, 0)
26
#define getfd_secure anon_inode_create_getfd
27
#else
28
#define getfd_secure anon_inode_getfd_secure
29
#endif
30
    ret = getfd_secure("[ksu_fdwrapper]", &data->ops, data, f->f_flags, NULL);
31
    if (ret < 0) {
32
        pr_err("ksu_fdwrapper: getfd failed: %d\n", ret);
33
        goto put_wrapper_data;
34
    }
35
    struct file* pf = fget(ret);
36

37
    struct inode* wrapper_inode = file_inode(pf);
38
    // copy original inode mode
39
    wrapper_inode->i_mode = file_inode(f)->i_mode;
40
    struct inode_security_struct *sec = selinux_inode(wrapper_inode);
41
    if (sec) {
42
        sec->sid = ksu_file_sid;
43
    }
44

45
    fput(pf);
46
    goto put_orig_file;
47
put_wrapper_data:
48
    ksu_delete_file_wrapper(data);
49
put_orig_file:
50
    fput(f);
51

52
    return ret;
53
}

‍

1
    // Create unconstrained file type
2
    ksu_type(db, KERNEL_SU_FILE, "file_type");
3
    ksu_typeattribute(db, KERNEL_SU_FILE, "mlstrustedobject");
4
    ksu_allow(db, ALL, KERNEL_SU_FILE, ALL, ALL);

‍

1
        if unsafe { libc::dup2(new_fd, fd) } == -1 {
2
            bail!("dup {new_fd} -> {fd} errno: {}", unsafe {
3
                *libc::__errno()
4
            });
5
        }

SELinux#

1
#ifndef __KSU_H_SELINUX
2
#define __KSU_H_SELINUX
3

4
#include "linux/types.h"
5
#include "linux/version.h"
6
#include "linux/cred.h"
7

8
void setup_selinux(const char *);
9

10
void setenforce(bool);
11

12
bool getenforce();
13

14
bool is_task_ksu_domain(const struct cred* cred);
15

16
bool is_ksu_domain();
17

18
bool is_zygote(const struct cred* cred);
19

20
bool is_init(const struct cred* cred);
21

22
void apply_kernelsu_rules();
23

24
u32 ksu_get_ksu_file_sid();
25

26
int handle_sepolicy(unsigned long arg3, void __user *arg4);
27

28
#endif
29

30
void setup_selinux(const char *domain)
31
{
32
    if (transive_to_domain(domain)) {
33
        pr_err("transive domain failed.\n");
34
        return;
35
    }
36
}

主要实现了selinux Domain的切换和一些关于SELinux的工具函数

1
static int transive_to_domain(const char *domain)
2
{
3
    struct cred *cred;
4
    struct task_security_struct *tsec;
5
    u32 sid;
6
    int error;
7

8
    cred = (struct cred *)__task_cred(current);
9

10
    tsec = cred->security;
11
    if (!tsec) {
12
        pr_err("tsec == NULL!\n");
13
        return -1;
14
    }
15

16
    error = security_secctx_to_secid(domain, strlen(domain), &sid);
17
    if (error) {
18
        pr_info("security_secctx_to_secid %s -> sid: %d, error: %d\n",
19
            domain, sid, error);
20
    }
21
    if (!error) {
22
        tsec->sid = sid;
23
        tsec->create_sid = 0;
24
        tsec->keycreate_sid = 0;
25
        tsec->sockcreate_sid = 0;
26
    }
27
    return error;
28
}

sepolicy#

1
#ifndef __KSU_H_SEPOLICY
2
#define __KSU_H_SEPOLICY
3

4
#include <linux/types.h>
5

6
#include "ss/policydb.h" // NOTE(review): presumably where struct policydb is declared - confirm
7

8
// Operation on types
9
bool ksu_type(struct policydb *db, const char *name, const char *attr); // like every function below, takes the policydb to operate on first; NOTE(review): bool presumably signals success - confirm
10
bool ksu_attribute(struct policydb *db, const char *name);
11
bool ksu_permissive(struct policydb *db, const char *type);
12
bool ksu_enforce(struct policydb *db, const char *type);
13
bool ksu_typeattribute(struct policydb *db, const char *type, const char *attr);
14
bool ksu_exists(struct policydb *db, const char *type);
15

16
// Access vector rules
17
bool ksu_allow(struct policydb *db, const char *src, const char *tgt,
18
           const char *cls, const char *perm); // all four rule functions share the (src, tgt, cls, perm) parameter list
19
bool ksu_deny(struct policydb *db, const char *src, const char *tgt,
20
          const char *cls, const char *perm);
21
bool ksu_auditallow(struct policydb *db, const char *src, const char *tgt,
22
            const char *cls, const char *perm);
23
bool ksu_dontaudit(struct policydb *db, const char *src, const char *tgt,
24
           const char *cls, const char *perm);
25

26
// Extended permissions access vector rules
27
bool ksu_allowxperm(struct policydb *db, const char *src, const char *tgt,
28
            const char *cls, const char *range); // xperm variants take a `range` string where the plain rules take `perm`
29
bool ksu_auditallowxperm(struct policydb *db, const char *src, const char *tgt,
30
             const char *cls, const char *range);
31
bool ksu_dontauditxperm(struct policydb *db, const char *src, const char *tgt,
32
            const char *cls, const char *range);
33

34
// Type rules
35
bool ksu_type_transition(struct policydb *db, const char *src, const char *tgt,
36
             const char *cls, const char *def, const char *obj); // the only type rule here that takes an extra `obj` argument
37
bool ksu_type_change(struct policydb *db, const char *src, const char *tgt,
38
             const char *cls, const char *def);
39
bool ksu_type_member(struct policydb *db, const char *src, const char *tgt,
40
             const char *cls, const char *def);
41

42
// File system labeling
43
bool ksu_genfscon(struct policydb *db, const char *fs_name, const char *path,
44
          const char *ctx);
45

46
#endif // __KSU_H_SEPOLICY

该模块实现了一套强大的 policydb 动态修补 API：通过直接操作内存中的 policydb 结构体，实现对 SELinux 规则的动态修补。

ksud部分#

‍

KernelSU#

kernel部分#

各模块分析#

allowlist#

app_sign#

app_profile#

传统linux权限#

设置uid / gid / group#

设置capabilities#

为什么要给进程添加 cap_dac_read_search 能力？#

Seccomp#

SELinux#

feature#

kernel_umount#

ksu#

ksud#

init进程监控#

ksud启动#

安全模式#

pkg_observer#

seccomp_cache#

setuid_hook#

sucompat#

supercall#

fd的分发#

内核ioctl分发器#

syscall_hook_manager#

throne_tracker#

file_wrapper#

SELinux#

sepolicy#

ksud部分#

#

为什么要给进程添加`cap_dac_read_search` 能力？#