新版梆梆检测绕过#

0x00 前言#

其实本来应该连dex解密流程一块讲的，但是上周一直在加班，没有时间写完，所以拆成两篇来写吧，这篇先只讲一下如何绕过frida检测，祈祷我下周不要再加班了

0x01 linker mini版#

入手#

IDA打开发现导入表空空如也，无需多言，先dump修复一份so，IDA打开之后发现只有寥寥数个函数，并且注册了constructor函数，那只好先去入口处看看了

1
__int64 sub_4780()
2
{
3
  _DWORD *j; // x2
4
  void *libc_handle; // x0
5
  int i; // [xsp-60h] [xbp-90h]
6
  int k; // [xsp-14h] [xbp-44h]
7

8
  for ( i = 273; i != 70; i = 70 )
9
    ;
10
  for ( j = (_DWORD *)((unsigned __int64)sub_4780 & 0xFFFFFFFFFFFFF000LL); *j != 0x464C457F; j -= 1024 )// ELF魔数
11
    ;
12
  shell_base = (__int64)j;
13
  libc_handle = dlopen("libc.so", 2);
14
  g_scanf = (__int64 (*)(_QWORD, const char *, ...))dlsym(libc_handle, "sscanf");
15
  for ( k = 273; k != 70; k = 70 )
16
    ;
17
  dword_15040 = dword_15008;                    // 0x8000
18
  dword_15064 = dword_1500C;                    // 0x1608
19
  dword_15078 = dword_15010;                    // 0x877
20
  dword_15030 = dword_15014;                    // 0x159000
21
  dword_15088 = dword_15018;                    // 0x15B000
22
  dword_15084 = dword_1501C;                    // 0x15C000
23
  dword_1507C = dword_15020;                    // 0x1181DD
24
  return sub_33F8();                            // 主加载流程
25
}

这是入口函数，上来就会被调用，其中0x464C457F是ELF魔数。这段代码从自身所在的页面开始，按页（每次0x1000字节）向低地址方向扫描，直到扫描到ELF魔数，从而查找自身的基地址，然后拿到sscanf的地址，存到全局变量中。我也不晓得这一通操作意欲何为。前一个还可以理解，这么做会比较节省时间，至于sscanf，直接拿来用不就行了吗，它这里还查找这个符号然后保存，有点没理解，有懂的大牛子可以解释一下

然后就是保存一些全局变量，都是写死的偏移或者密钥信息，比较重要，后续解密时会用到。最后就是这个壳so最重要的函数了sub_33F8()

定位#

建议如果要分析的话，先看看这个简单的项目吧，因为项目里so加载流程和这个壳不能说100%一样，但是也有90%是一样的 Yuuki/soLoader

这个函数有900多行，不算很复杂，而且核心函数一目了然。它调用了 mmap，dlopen，mprotect等函数，结合之前发现的，1.36M的so，反编译之后就几个函数，其他地方都是被加密的，那不难猜到这个函数的作用就是在运行时动态解密释放真正的so，然后真正的so再去对dex做解密等操作。如果是简单的upx壳，那么大概率不会使用到dlopen，因为upx只需要申请内存，解密payload即可，但是这里它调用了dlopen，还是在一个循环中调用的

1
do {
2
    while ( *v76 != 1 )  {
3
        v76 += 2;
4
        if ( v76 == v91 )
5
            goto LABEL_186;
6
        }
7
        v92 = v76[1];
8
        v76 += 2;
9
        *(&v123 + (int)v90++) = (__int64)dlopen((const char *)(v118 + v92), 2);
10
    }
11
while ( v76 != v91 );

这很明显就是在处理DT_NEEDED条目了，那么这个函数，基本上可以初步判断为一个简易的linker，职责是加载真正的so

那么我们当下的直接目标就是解密出真正的so，所以先来简单分析一下这个函数吧~，我只截取关键的部分，感兴趣的可以自己从头看看

1
v5 = fopen("/proc/self/maps", "r");
2
  memset(v143, 0, 0x400u);
3
  v123 = 0;
4
  v122 = 0;
5
  memset(v142, 0, 0x100u);
6
  while ( fgets((char *)v143, 1024, v5) )       // 解析maps，根据shell_base判断是否为so自身，取出so路径
7
  {
8
    g_scanf(v143, "%lx-%lx %s %s %s %s %s", &v122, &v123, v142, v142, v142, v142, so_path);
9
    if ( v122 <= shell_base && shell_base < v123 )
10
      break;
11
  }
12
  fclose(v5);
13
  v102 = so_path;
14
  so_file_handle = open((const char *)so_path, 0x80000);

这里反编译之后跟看源码没啥区别。先解析maps，根据上面拿到的 so 基地址来判断当前条目是否命中，命中取出 so 路径，为了拿到libDexHelper.so的路径。这里这么做是因为android加载so时，会从 /data/app/一串神秘代码/libs 下加载，而厂商的代码是写死的，他不知道这个神秘代码是啥就拿不到文件的磁盘路径，所以需要这样获取一下。当然我觉得直接在内存里操作也是可以的，不过这个看个人喜好了

拿到路径之后，它做了如下三件事情

1
pread(so_file_handle, &qword_15050, 0x14u, (unsigned int)dword_1507C);// 从0x1181DD读20字节
2
dword_15080 = dword_15060;
3
memset(so_path, 0, 64);
4
qword_15068 = qword_15050;
5
qword_15070 = qword_15058;
6
pread(so_file_handle, so_path, 0x40u, (unsigned int)dword_15040);// 从0x8000读64字节
7
((void (__fastcall *)(_QWORD *, _QWORD))sub_3184)(so_path, (unsigned int)dword_15040);// RC4解密64字节 7F454C4602010... 这是ELF头

读了磁盘上的so的特定偏移的一些数据，这些偏移地址是写死的，上述初始化函数里提到过。其中 sub_3184 是一个变种的RC4算法，密钥用的是 qword_15068 和 qword_15070（共16字节），它们来自从0x1181DD读出的20字节中的前16字节，所以这一块的逻辑就是：读取密钥，读取要解密的64字节，调用解密函数，解密

解密出的数据如下：

7F454C460201010000000000000000000300B70001000000B0F8000000000000400000000000000000F71000000000000000000040003800080040001A001900

这完全验证了我们之前的猜想，这是一个标准的ELF头，所以这个函数的确是一个迷你的linker，并且我们已经拿到了ELF头的解密算法，接下来就是找剩下的数据是如何被加密的了

1
v36 = v35;
2
v111 = v35;
3
v37 = (unsigned __int8 *)mmap((void *)((v32 + v110) & 0xFFFFFFFFFFFFF000LL), v35, 3, 50, 0, 0);// 对每个 `PT_LOAD` 段做映射/拷贝
4
v38 = v37;
5
if ( v37 == (unsigned __int8 *)-1LL )
6
  break;
7
v39 = HIDWORD(v113);
8
if ( lseek(SHIDWORD(v113), (unsigned int)v107 & 0xFFFFF000, 0) == -1 )
9
  break;
10
v112 = read(v39, v37, v36);         // 读取每个段内容
11
if ( (_DWORD)v112 == -1 )
12
  break;
13
if ( v28 != 1 ) {
14
  ((void (__fastcall *)(unsigned __int8 *, _QWORD, _QWORD))sub_2B1C)(v37, 0, (unsigned int)v112);// 循环调用xor解密函数，解密各个段
15
    goto LABEL_124;
16
}
17
v40 = v133;
18
v131 = 0;
19
v132 = 30;
20
v133[0] = 273;

关键解密函数是sub_2B1C，这就是一个简单的xor加解密

1
char *__fastcall sub_2B1C(__int64 a1, int a2, int a3)
2
{
3
  char *result; // x0
4
  char *v4; // x3
5
  char v5; // t1
6
  int i; // [xsp-34h] [xbp-44h]
7

8
  for ( i = 273; i != 70; i = 70 )
9
    ;
10
  result = (char *)(a1 + a2);
11
  v4 = result;
12
  if ( a3 )
13
  {
14
    do
15
    {
16
      v5 = *v4++;
17
      *(v4 - 1) = dword_15080 ^ v5;             // xor 0x41
18
    }
19
    while ( a3 > (unsigned __int64)(unsigned int)((_DWORD)v4 - (_DWORD)result) );
20
  }
21
  return result;
22
}

密钥是0x41，之前读20字节的时候读出来的（即20字节中的最后4字节 dword_15060，随后被保存到 dword_15080），那么就可以静态解密出真正的so了。当然你也可以运行时动态dump，我看见有的朋友是直接在dlopen onLeave的时候扫描匿名可执行内存，然后直接dump的，这样也可以的，并且不用分析壳so的逻辑，建议大家这么做

分析到这里就可以解密出主so了，但是本着来都来了的心态，还是看看后面它做了哪些操作吧

1
v21 = (void *)(v12 & 0xFFFFF000);
2
v22 = ((v17 + 4095) & 0xFFFFF000) - (unsigned int)v21;
3
real_base = mmap(v21, v22, 3, 34, -1, 0);   // 分配匿名内存，用于映射真正的so

1
if ( mprotect(v38, v111, (*(_DWORD *)v29 >> 2) & 1 | *(_DWORD *)v29 & 2 | (4 * (*(_DWORD *)v29 & 1))) == -1 )// 恢复各个段的权限
2
goto LABEL_131;
3
if ( (*(_DWORD *)v29 & 2) != 0 )
4
  break;
5
v67 = (*(_DWORD *)v29 >> 2) & 1 | 2;
6
v68 = (*(_DWORD *)v29 & 1) != 0 ? 4 : 0;
7
v29 += 56LL;
8
mprotect(v38, v111, v67 | v68);
9
v30 = v25 == ++v27;

1
((void (__fastcall *)(unsigned __int64, __int64, __int64, _QWORD, __int64 *, _QWORD, __int64))sub_2CD0)(// 一种重定位
2
            v119,
3
            v118,
4
            v123,
5
            (unsigned int)v124,
6
            &v123,
7
            v90,
8
            v117);
9
          ((void (__fastcall *)(unsigned __int64, __int64, __int64, _QWORD, __int64 *, _QWORD, __int64))sub_2CD0)(// 另一种重定位
10
            v93,
11
            v94,
12
            v129,
13
            (unsigned int)len,
14
            &v123,
15
            v90,
16
            v95);

1
 v57 = ((__int64 (__fastcall *)(unsigned __int64, const void *, _QWORD, __int64, __int64))sub_303C)(// 查找JNI_OnLoad
2
                  v107,
3
                  v106,
4
                  (unsigned int)v115,
5
                  v109,
6
                  v110);
7
          if ( v80 != (void (__fastcall *)(__int64))-1LL && v80 )
8
            v80(v57);
9
          for ( i = 0; (unsigned int)v74 > (unsigned int)i; ++i )// 调内层so的.init_array
10
          {
11
            v59 = *(void (**)(void))(v77 + 8 * i);
12
            if ( v59 != (void (*)(void))-1LL && v59 )
13
              v59();
14
          }

1
 memcpy((void *)(shell_base + (unsigned int)dword_15084), (const void *)v116, v63);// 把内层 SysV hash 拷到外层 `0x15C000`
2
          memcpy(v64, v62, (unsigned int)dword_15064);// 把内层 dynsym 拷到外层 `0x159000`
3
          memcpy(v65, v61, (unsigned int)dword_15078);// 把内层 dynstr 拷到外层 `0x15B000`
4
          close(SHIDWORD(v105));

总结下来就是：

从 /proc/self/maps 定位当前 so 的真实文件路径
打开自身文件
读取尾部密钥材料
读取并解密内层 ELF 头
映射并解密包含 Program Header 的第一页
计算内层镜像范围并申请最终地址空间
逐段读取、XOR 解密、装载 PT_LOAD，完成 BSS
解析 PT_DYNAMIC
dlopen 依赖库
用自定义解析器做重定位
定位内层 JNI_OnLoad
调用 DT_INIT 和 INIT_ARRAY
把内层 hash/dynsym/dynstr 回填到外层壳的预留区
返回，等待外部以后通过外层库视图解析到内层符号

感觉和我之前写的差不多，但是我把加密的步骤前置了 so加固玩具版

主so解密#

1
from __future__ import annotations
2

3
import argparse
4
from pathlib import Path
5
import sys
6

7

8
PAYLOAD_OFFSET = 0x8000
9
TAIL_OFFSET = 0x1181DD
10
TAIL_SIZE = 0x14
11
HEADER_SIZE = 0x40
12
STREAM_KEY_SIZE = 16
13

14

15
def rc4_like_decrypt_header(enc_header: bytes, stream_key: bytes) -> bytes:
    """Decrypt the encrypted inner ELF header with an RC4-style stream cipher.

    Args:
        enc_header: Exactly HEADER_SIZE encrypted bytes.
        stream_key: Exactly STREAM_KEY_SIZE key bytes.

    Returns:
        The decrypted header, same length as ``enc_header``.

    Raises:
        ValueError: If either argument has an unexpected length.
    """
    header_len = len(enc_header)
    if header_len != HEADER_SIZE:
        raise ValueError(f"expected {HEADER_SIZE:#x}-byte header, got {header_len:#x}")
    key_len = len(stream_key)
    if key_len != STREAM_KEY_SIZE:
        raise ValueError(f"expected {STREAM_KEY_SIZE} key bytes, got {key_len}")

    # Key scheduling: permute the 256-entry state, cycling through the key.
    state = list(range(256))
    mix = 0
    for slot in range(256):
        mix = (mix + state[slot] + stream_key[slot % STREAM_KEY_SIZE]) & 0xFF
        state[slot], state[mix] = state[mix], state[slot]

    # Keystream generation: one keystream byte is XORed over each input byte.
    plain = bytearray()
    a = 0
    b = 0
    for cipher_byte in bytearray(enc_header):
        a = (a + 1) & 0xFF
        b = (b + state[a]) & 0xFF
        state[a], state[b] = state[b], state[a]
        plain.append(cipher_byte ^ state[(state[a] + state[b]) & 0xFF])

    return bytes(plain)
41

42

43
def decrypt_libdexhelper_outer(outer_data: bytes) -> tuple[bytes, int]:
    """Recover the inner ELF embedded in the outer (shell) library image.

    The key material is the TAIL_SIZE bytes at TAIL_OFFSET: the first
    STREAM_KEY_SIZE bytes key the header cipher, the next byte is the
    single-byte XOR key for everything after the header.

    Args:
        outer_data: Full contents of the protected outer .so file.

    Returns:
        ``(inner_elf_bytes, body_xor_key)``.

    Raises:
        ValueError: If the file is too short to contain the key material or
            the payload is shorter than the encrypted header.
    """
    required = TAIL_OFFSET + TAIL_SIZE
    actual = len(outer_data)
    if actual < required:
        raise ValueError(
            f"file too small: need at least {required:#x} bytes, got {actual:#x}"
        )

    key_material = outer_data[TAIL_OFFSET:required]
    rc4_key = key_material[:STREAM_KEY_SIZE]
    xor_byte = key_material[STREAM_KEY_SIZE]

    encrypted = bytes(outer_data[PAYLOAD_OFFSET:TAIL_OFFSET])
    if len(encrypted) < HEADER_SIZE:
        raise ValueError("embedded payload is smaller than the encrypted header")

    # The body is XOR-encrypted with a single byte; the first HEADER_SIZE
    # bytes are encrypted separately with the RC4-like routine.
    body = bytes(value ^ xor_byte for value in encrypted[HEADER_SIZE:])
    header = rc4_like_decrypt_header(encrypted[:HEADER_SIZE], rc4_key)

    return header + body, xor_byte
66

67

68
def build_default_output_path(input_path: Path) -> Path:
    """Derive the default output path, placed next to the input file.

    ``name.ext`` becomes ``name.hidden.decrypted.ext``; a name without an
    extension gets ``.hidden.decrypted.so`` appended.
    """
    extension = input_path.suffix
    if not extension:
        return input_path.with_name(f"{input_path.name}.hidden.decrypted.so")
    return input_path.with_name(f"{input_path.stem}.hidden.decrypted{extension}")
72

73

74
def parse_args(argv: list[str]) -> argparse.Namespace:
    """Parse the command line.

    Args:
        argv: Arguments without the program name.

    Returns:
        Namespace with ``input`` (Path) and ``output`` (Path or None).
    """
    cli = argparse.ArgumentParser(
        description="Decrypt the hidden inner ELF from this protected libDexHelper.so sample."
    )
    cli.add_argument("input", type=Path, help="Path to the encrypted outer libDexHelper.so")
    output_help = "Output path for the decrypted inner ELF. Defaults next to the input file."
    cli.add_argument("-o", "--output", type=Path, help=output_help)
    namespace = cli.parse_args(argv)
    return namespace
86

87

88
def main(argv: list[str]) -> int:
    """Decrypt the input file, write the inner ELF, and print a short report.

    Args:
        argv: Command-line arguments without the program name.

    Returns:
        0 on success.

    Raises:
        RuntimeError: If the decrypted data does not start with the ELF magic.
    """
    args = parse_args(argv)
    source: Path = args.input
    destination: Path = args.output if args.output else build_default_output_path(source)

    inner_elf, body_key = decrypt_libdexhelper_outer(source.read_bytes())

    # Sanity check before anything is written to disk.
    magic = inner_elf[:4]
    if magic != b"\x7fELF":
        raise RuntimeError(
            "decryption completed, but the result does not start with ELF magic; "
            "double-check the sample matches this script."
        )

    destination.write_bytes(inner_elf)

    report = (
        f"input : {source}",
        f"output: {destination}",
        f"tail offset   : {TAIL_OFFSET:#x}",
        f"payload offset: {PAYLOAD_OFFSET:#x}",
        f"body xor key  : {body_key:#x}",
        f"payload size  : {len(inner_elf):#x}",
        f"elf magic     : {magic.hex()}",
    )
    for row in report:
        print(row)

    return 0
113

114

115
if __name__ == "__main__":
    # Any ordinary exception is reported on stderr and turned into exit
    # status 1; otherwise the process exits with main()'s return value.
    try:
        exit_status = main(sys.argv[1:])
    except Exception as exc:
        print(f"error: {exc}", file=sys.stderr)
        sys.exit(1)
    sys.exit(exit_status)

运行一下，就要开始分析主so了捏

铺垫#

我们后面在hook主so里的函数时需要使用主so的基地址+函数偏移，但是主so是被映射到它自己mmap的匿名内存上的，这里有很多方案，我们选择相对优雅的一种

之前分析出了

1
real_base = mmap(v21, v22, 3, 34, -1, 0);   // 分配匿名内存，用于映射真正的so

我们直接hook mmap，根据后面四个参数值进行过滤即可，如果噪音过多，可以根据映射大小进一步过滤。过滤完可以看到只剩这样的输出

1
[+] inner base = 0x7c01620000
2
[+] mmap args  = addr=0x0 len=0x134000 prot=0x3 flags=0x22 fd=-1 off=0x0 ra=0x7c00c21888

1
var target_so = "libDexHelper.so";
2
var linker_name = Process.pointerSize === 8 ? "linker64" : "linker";
3
var call_constructors_offset = 0xb4900; // oriole / Pixel 6
4

5
var target_seen = false;
6
var found = false;
7
var mmap_hooked = false;
8

9
var outer_base = null;
10
var outer_size = 0;
11

12
/*
 * Hook libc's mmap once and report the first successful call that
 *   - returns into the outer shell library [outer_base, outer_base + outer_size), and
 *   - uses prot=3, flags=0x22, fd=-1, offset=0.
 * That mapping is treated as the base of the inner (real) library.
 */
function hook_mmap() {
    if (mmap_hooked) {
        return;
    }
    mmap_hooked = true;

    var mmap_ptr = Module.findExportByName("libc.so", "mmap");
    Interceptor.attach(mmap_ptr, {
        onEnter: function (args) {
            // Snapshot the call so onLeave can filter on it.
            this.addr = args[0];
            this.len = args[1];
            this.prot = args[2].toInt32();
            this.flags = args[3].toInt32();
            this.fd = args[4].toInt32();
            this.off = args[5].toUInt32();
            this.ra = this.returnAddress;
        },
        onLeave: function (retval) {
            if (found || retval.isNull() || outer_base == null) {
                return;
            }

            // Ignore callers outside the outer shell library.
            if (this.ra.compare(outer_base) < 0) {
                return;
            }
            if (this.ra.compare(outer_base.add(outer_size)) >= 0) {
                return;
            }

            var matches_signature =
                this.prot === 3 &&
                this.flags === 0x22 &&
                this.fd === -1 &&
                this.off === 0;
            if (!matches_signature) {
                return;
            }

            found = true;
            console.log("[+] inner base =", retval);
            console.log(
                "[+] mmap args  =",
                "addr=" + this.addr,
                "len=" + this.len,
                "prot=0x" + this.prot.toString(16),
                "flags=0x" + this.flags.toString(16),
                "fd=" + this.fd,
                "off=0x" + this.off.toString(16),
                "ra=" + this.ra
            );
        }
    });
}
56

57
/*
 * Hook the linker's call_constructors routine (located by a hard-coded,
 * device-specific offset). Once the target library has been requested and
 * is visible as a module, record its range and install the mmap hook so the
 * shell's constructor is observed.
 */
function hook_linker_call_constructors() {
    if (hook_linker_call_constructors.hooked) {
        return;
    }
    hook_linker_call_constructors.hooked = true;

    var linker_base = Module.getBaseAddress(linker_name);
    if (!linker_base) {
        return;
    }

    Interceptor.attach(linker_base.add(call_constructors_offset), {
        onEnter: function (args) {
            var armed = target_seen && !mmap_hooked && !found;
            if (!armed) {
                return;
            }

            var shell = Process.findModuleByName(target_so);
            if (shell == null) {
                return;
            }

            outer_base = shell.base;
            outer_size = shell.size;
            hook_mmap();
        }
    });
}
78

79
/*
 * Watch android_dlopen_ext; when the requested path contains target_so,
 * flag it and install the call_constructors hook.
 */
function hook_dlopen() {
    var dlopen_ext = Module.findExportByName(null, "android_dlopen_ext");
    Interceptor.attach(dlopen_ext, {
        onEnter: function (args) {
            if (found) {
                return;
            }

            var path_ptr = args[0];
            if (path_ptr.isNull()) {
                this.fileName = "";
            } else {
                this.fileName = path_ptr.readCString();
            }

            if (!this.fileName || this.fileName.indexOf(target_so) < 0) {
                return;
            }
            target_seen = true;
            hook_linker_call_constructors();
        }
    });
}
92

93
hook_dlopen();

如此我们便可以知道映射大小=len=0x134000的时候的返回值是我们要的，我们就可以写出更简洁的脚本

1
// Report the first successful mmap whose length is 0x134000 (the size of
// the inner library's reservation observed with the longer script).
var found = false;

Interceptor.attach(Module.findExportByName("libc.so", "mmap"), {
    onEnter: function (args) {
        this.len = args[1].toUInt32();
    },
    onLeave: function (retval) {
        if (found || retval.isNull() || this.len !== 0x134000) {
            return;
        }
        found = true;
        console.log("[+] inner base =", retval);
    }
});

0x02 正文#

蓝蓝一片非常之爽，.init_array里没有注册函数，但是JNI_OnLoad反编译之后居然有3000行，那暂时先不看了

先来明确一下目标吧

过frida检测
静态解密dex完成脱壳

到现在为止还没咋使用到frida，但是不用想，附加上去启动app包是会崩溃的。目前已知所有重要逻辑入口都在JNI_OnLoad，那直接来trace一下函数调用链吧

0x02.1 frida检测绕过#

初步绕过#

这里使用到oacia大佬的stalker_trace_so，建议大家优先使用这个工具，他可以记录所有IDA识别出来并且被主线程执行到的函数，帮我们快速定位大致范围

需要注意的是生成的脚本在trace时基地址要稍作修改，因为它的主so是动态释放的

1
var so_name = "libDexHelper.so";
2
var inner_base = null;
3
var trace_started = false;
4
var found = false;
5
var mmap_listener = null;
6

7
/*
8
    @param print_stack: Whether printing stack info, default is false.
9
*/
10
var print_stack = false;
11

12
/*
13
    @param print_stack_mode
14
    - FUZZY: print as much stack info as possible
15
    - ACCURATE: print stack info as accurately as possible
16
    - MANUAL: if printing the stack info in an error and causes exit, use this option to manually print the address
17
*/
18
var print_stack_mode = "FUZZY";
19

20
/*
 * Print every loaded module that contains `addr`, together with the offset
 * of `addr` inside it.
 *
 * @param addr NativePointer to look up (e.g. one frame of Thread.backtrace).
 *
 * NativePointer values are compared with compare() and subtracted with
 * sub(): the relational and arithmetic operators would go through
 * string/number coercion instead of comparing the pointer values. The lower
 * bound is inclusive so an address equal to the module base is matched too.
 */
function addr_in_so(addr){
    var modules = Process.enumerateModules();
    for (var i = 0; i < modules.length; i++) {
        var mod = modules[i];
        var mod_end = mod.base.add(mod.size);
        if (addr.compare(mod.base) >= 0 && addr.compare(mod_end) < 0) {
            console.log(addr.toString(16), "is in", mod.name, "offset: 0x" + addr.sub(mod.base).toString(16));
        }
    }
}
28

29
/*
 * Watch android_dlopen_ext for so_name. When that call returns and the
 * inner base has already been captured by the mmap hook, detach the mmap
 * hook and start the Stalker trace.
 */
function hook_dlopen() {
    Interceptor.attach(Module.findExportByName(null, "android_dlopen_ext"),
        {
            onEnter: function (args) {
                var pathptr = args[0];
                // A NULL filename is a NativePointer object, so it must be
                // tested with isNull(); comparing against null never matches.
                if (pathptr === undefined || pathptr === null || pathptr.isNull()) {
                    return;
                }
                var path = pathptr.readCString();
                //console.log(path);
                if (path !== null && path.indexOf(so_name) >= 0) {
                    this.is_can_hook = true;
                }
            },
            onLeave: function (retval) {
                if (!this.is_can_hook || trace_started) {
                    return;
                }
                console.log("[+] mmap base   = " + inner_base);
                console.log("[+] use mmap base = " + inner_base);

                // note: you can do any thing before or after stalker trace so.
                if (inner_base == null) {
                    return;
                }
                if (mmap_listener != null) {
                    mmap_listener.detach();
                    mmap_listener = null;
                    console.log("[+] mmap hook detached");
                }
                trace_so();
            }
        }
    );
}
61

62
/*
 * Capture the return value of the first successful mmap of length 0x134000
 * as inner_base. The listener is kept in mmap_listener so it can be
 * detached later.
 */
function hook_mmap() {
    var mmap_ptr = Module.findExportByName("libc.so", "mmap");
    mmap_listener = Interceptor.attach(mmap_ptr, {
        onEnter: function (args) {
            this.len = args[1].toUInt32();
        },
        onLeave: function (retval) {
            if (found || retval.isNull() || this.len !== 0x134000) {
                return;
            }
            found = true;
            // Store a copy of the pointer value rather than retval itself.
            inner_base = ptr(retval.toString());
            console.log("[+] inner base = " + inner_base);
        }
    });
}
78

79
/*
 * Follow the current thread with Stalker and log, at block-compile time,
 * every instruction whose offset from inner_base appears in func_addr
 * (paired by index with func_name). libc.so is excluded from instrumentation.
 * Optionally emits a backtrace callout according to print_stack /
 * print_stack_mode.
 *
 * NOTE(review): func_addr / func_name are not defined in this snippet; they
 * are presumably the numeric offset / name tables emitted by the generator
 * tool. Confirm before reuse.
 */
function trace_so(){
    if (inner_base == null || trace_started) return;

    trace_started = true;
    var times = 1;
    var module_base = inner_base;
    // Offsets are matched as 32-bit numbers. Anything below the base or more
    // than 4 GiB above it cannot be a real match, and must be rejected before
    // toUInt32() truncates it into a value that could alias a function offset.
    var max_offset = ptr("0xffffffff");
    var tid = Process.getCurrentThreadId();

    // Build the backtrace callout for the current settings, or null if disabled.
    function backtrace_callout() {
        if (!print_stack) return null;
        if (print_stack_mode === "FUZZY") {
            return function (context) {
                console.log("backtrace:\n"+Thread.backtrace(context, Backtracer.FUZZY).map(DebugSymbol.fromAddress).join('\n'));
                console.log('---------------------')
            };
        }
        if (print_stack_mode === "ACCURATE") {
            return function (context) {
                console.log("backtrace:\n"+Thread.backtrace(context, Backtracer.ACCURATE).map(DebugSymbol.fromAddress).join('\n'));
                console.log('---------------------')
            };
        }
        if (print_stack_mode === "MANUAL") {
            return function (context) {
                console.log("backtrace:")
                Thread.backtrace(context, Backtracer.FUZZY).map(addr_in_so);
                console.log('---------------------')
            };
        }
        return null;
    }

    console.log("start Stalker!");
    var libc = Process.getModuleByName("libc.so");
    Stalker.exclude({
        "base": libc.base,
        "size": libc.size
    });
    Stalker.follow(tid,{
        events:{
            call:false,
            ret:false,
            exec:false,
            block:false,
            compile:false
        },
        onReceive:function(events){
        },
        transform: function (iterator) {
            var instruction;
            // Guard against a null first instruction instead of dereferencing it.
            while ((instruction = iterator.next()) !== null) {
                var index = -1;
                if (instruction.address.compare(module_base) >= 0) {
                    var delta = instruction.address.sub(module_base);
                    if (delta.compare(max_offset) <= 0) {
                        index = func_addr.indexOf(delta.toUInt32());
                    }
                }
                if (index !== -1) {
                    console.log("call" + times + ":" + func_name[index])
                    times = times + 1
                    var callout = backtrace_callout();
                    if (callout !== null) {
                        iterator.putCallout(callout);
                    }
                }
                iterator.keep();
            }
        },

        onCallSummary:function(summary){

        }
    });
    // Printed as soon as follow() has been set up; tracing continues afterwards.
    console.log("Stalker end!");
}
142

143
hook_mmap();
144
setImmediate(hook_dlopen,0);

只看最后几条日志

1
call107:sub_402CC
2
call108:sub_3ED48
3
call109:regfree
4
call110:usleep
5
call111:dlopen
6
call112:dlsym
7
call113:sub_AED04
8
call114:sub_AE270
9
call115:sub_AEA58
10
call116:mmap
11
call117:sub_AF28C
12
call118:sub_AF4C8
13
call119:sub_AEE3C
14
call120:stat
15
call121:dlclose
16
call122:sub_42868
17
call123:sub_1304C

直接hook sub_1304C试试看，当然这样不严谨，但是可以快速看看有没有效果

1
Spawned `com.moutai.mall`. Resuming main thread!
2
[Pixel 6::com.moutai.mall ]-> [+] inner base = 0x7c00ce9000
3
[+] mmap hook detached
4
[+] patched sub_1304C @ 0x7c00cfc04c
5
[+] dlopen hook detached
6
Process terminated
7
[Pixel 6::com.moutai.mall ]->

依旧崩了，但是这次的崩溃相较上一次正常得多，判断为不是被同一处检测点检测到了，把hook sub_1304C的逻辑加上，再trace一次

1
/*
 * Replace sub_1304C (inner_base + 0x1304c) with a stub that logs its three
 * arguments and returns 0. Does nothing until inner_base is known, and only
 * installs the replacement once.
 */
function rep_sub1304C() {
    if (sub1304c_replaced || inner_base == null) {
        return;
    }

    var target = inner_base.add(0x1304c);
    console.log("[+] replacing sub_1304C @ " + target);

    var stub = new NativeCallback(function (flag, code, mask) {
        var message =
            "[+] skip sub_1304C(flag=" + flag.toString() +
            ", code=0x" + code.toString(16) +
            ", mask=0x" + mask.toString(16) + ")";
        console.log(message);
        return 0;
    }, 'int64', ['int64', 'uint32', 'int']);
    Interceptor.replace(target, stub);

    sub1304c_replaced = true;
}

这次的日志的最后几行

1
call188:sub_24F18
2
call189:.strcasecmp
3
call190:sub_105B8
4
call191:sub_FE78
5
call192:sub_40B04
6
call193:sub_3DBB4
7
call194:sub_3DF50
8
call195:sub_406E8
9
call196:sub_41838
10
call197:sub_408C4
11
Process terminated
12
[Pixel 6::com.moutai.mall ]->

初步看了一下，上面几个没啥可疑的，估计就是检测到了然后正常退出，这里由于最后几条函数并不是检测函数和退出函数，所以这里大概率不是同步的检测。或者还有一种可能，假设函数B是检测函数，函数A调用B，然后根据B的返回结果决定是否退出App。当前trace脚本只能记录“执行流进入了哪些函数入口”，但没有记录“函数返回到了哪里”以及“调用者在拿到返回值后又执行了什么分支逻辑”，所以只能看到A和B都执行过，却不一定能定位到 A 在函数内部哪一条指令上完成了退出。

进一步绕过#

搞这里也是时间有点晚了，我也懒得跟他废话了，直接用内核模块监控一下哪里给我app干崩了(上文已经分析出此处的崩溃是正常的退出)

1
[43097.547378] [Yuuki] === kill_monitor: kill (PID:19581 UID:10282 com.moutai.mall) sig=9 ===
2
[43097.547388] [Yuuki] [UID 10282] #00 pc = 0x7c007720a4 ???!0x190a4
3
[43097.547390] [Yuuki] [UID 10282] #01 pc = 0x7d41443600 [anon:scudo:primary_reserve]!0xabf7600
4
[43097.547392] [Yuuki] === end backtrace (2 frames) ===
5
[43097.547394] [Yuuki]
6
[43097.548342] [Yuuki] === kill_monitor: kill (PID:19581 UID:10282 com.moutai.mall) sig=9 ===
7
[43097.548346] [Yuuki] [UID 10282] #00 pc = 0x7c00772424 ???!0x19424
8
[43097.548348] [Yuuki] [UID 10282] #01 pc = 0x7d41443600 [anon:scudo:primary_reserve]!0xabf7600
9
[43097.548351] [Yuuki] === end backtrace (2 frames) ===
10
[43097.548353] [Yuuki]

一共两处，IDA跳过去看看

两处都是直接svc call __NR_kill函数直接退的，果然是像我们上面猜测的那样，我们直接给它们patch掉就行了

1
var target_so = "libDexHelper.so";
2
var inner_base = null;
3
var found = false;
4
var patched = false;
5
var callbacks = [];
6
var mmap_listener = null;
7
var dlopen_listener = null;
8

9
/*
 * Overwrite the 4-byte instruction at `addr` with `mov x0, xzr` and log it.
 *
 * @param addr NativePointer of the instruction to replace.
 * @param tag  Label used in the log line.
 */
function patchArm64MovX0Zero(addr, tag) {
    var insn_size = 4;

    function emit_mov_x0_zero(code) {
        var w = new Arm64Writer(code, { pc: addr });
        w.putMovRegReg("x0", "xzr");
        w.flush();
    }

    Memory.patchCode(addr, insn_size, emit_mov_x0_zero);
    console.log("[+] patched " + tag + " @ " + addr + " (mov x0, xzr)");
}
17

18
/*
 * Apply all patches once inner_base is known: replace sub_1304C with a stub
 * returning 0, and overwrite the two instructions at +0x190a0 / +0x19420
 * (labelled as the kill syscalls) with `mov x0, xzr`.
 */
function applyPatches() {
    if (inner_base == null || patched) {
        return;
    }

    var sub1304c = inner_base.add(0x1304c);
    var stub = new NativeCallback(function () {
        return 0;
    }, "int", []);
    // Keep a reference to the callback in the script-level list.
    callbacks.push(stub);
    Interceptor.replace(sub1304c, stub);
    console.log("[+] patched sub_1304C @ " + sub1304c);

    var kill_sites = [
        [0x190a0, "kill syscall #1"],
        [0x19420, "kill syscall #2"]
    ];
    for (var i = 0; i < kill_sites.length; i++) {
        patchArm64MovX0Zero(inner_base.add(kill_sites[i][0]), kill_sites[i][1]);
    }

    patched = true;
}
35

36
// Capture the inner base from the first successful mmap of length 0x134000,
// then detach this listener.
mmap_listener = Interceptor.attach(Module.findExportByName("libc.so", "mmap"), {
    onEnter: function (args) {
        this.len = args[1].toUInt32();
    },
    onLeave: function (retval) {
        if (found || retval.isNull() || this.len !== 0x134000) {
            return;
        }

        found = true;
        // Store a copy of the pointer value rather than retval itself.
        inner_base = ptr(retval.toString());
        console.log("[+] inner base = " + inner_base);

        if (!mmap_listener) {
            return;
        }
        mmap_listener.detach();
        mmap_listener = null;
        console.log("[+] mmap hook detached");
    }
});
55

56
// When android_dlopen_ext returns for target_so and the inner base is known,
// apply the patches and detach this listener.
dlopen_listener = Interceptor.attach(Module.findExportByName(null, "android_dlopen_ext"), {
    onEnter: function (args) {
        var path_ptr = args[0];
        if (path_ptr.isNull()) {
            this.fileName = "";
        } else {
            this.fileName = path_ptr.readCString();
        }
    },
    onLeave: function (retval) {
        if (patched) {
            return;
        }

        var is_target = this.fileName && this.fileName.indexOf(target_so) >= 0;
        if (!is_target || inner_base == null) {
            return;
        }

        applyPatches();
        if (!dlopen_listener) {
            return;
        }
        dlopen_listener.detach();
        dlopen_listener = null;
        console.log("[+] dlopen hook detached");
    }
});

直接注入启动，app完美运行，美美得吃了也是

但是这种方式并不是很优雅，毕竟不是每个人都能用内核模块。值得注意的是上面两个退出点都在JNI_OnLoad函数中，这就很值得注意了，正常检测逻辑怎么会放在这个函数中呢？我觉得只有傻*才会这样写代码，所以这里JNI_OnLoad只是起到一个最终的决策作用。具体来说就是JNI_OnLoad里通过无论是新建线程还是直接同步调用函数的方式，去启动检测函数，然后不在检测函数里执行退出机制，而是拿到检测函数的结果，集中在JNI_OnLoad里进行处理。当然这些只是我的猜测，至于为什么这么做，可能是因为JNI_OnLoad经过了混淆，开发者觉得大多数逆向人员不会去优先看这个函数。事实也的确如此

有的朋友通过hook clone那套 + 处理sub_1304C也能绕过检测，但是我感觉这样比较麻烦

更一般的方式#

我们继续来优雅(暴力)的解决刚刚的问题吧

已知退出是正常的退出，只是通过svc直接call内核函数而已。这里可以有一些大众的处理方案

直接trace指令，注册svc的callback，打印内核函数名和参数就行了，直接就能定位到第一现场。这个我是尝试了一下，确实是可行的
直接IDA扫所有svc指令，反向污点确定x8寄存器的值，根据系统调用号(Android arm64 系统调用号是存在x8寄存器的)进行过滤，然后全都patch掉

这里我们直接选择方案二，因为它足够简单，直接写个IDA脚本，帮我们生成对应的frida patch脚本代码，这里我只处理了 exit， exit_group，kill，tkill，tgkill，其他的退出方式并没有做处理，抛砖引玉感兴趣的大佬可以自行拓展

1
import os
2
import re
3

4
import idautils
5
import ida_bytes
6
import ida_funcs
7
import ida_kernwin
8
import ida_segment
9
import idc
10

11

12
TARGET_SYSCALLS = {
13
    93: "exit",
14
    94: "exit_group",
15
    129: "kill",
16
    130: "tkill",
17
    131: "tgkill",
18
}
19
BACKTRACK_LIMIT = 20
20
PATCH_FILE_NAME = "termination_patch_snippet.txt"
21

22

23
def log(msg=""):
    """Print ``msg`` (an empty line by default) to the IDA output window."""
    text = msg
    print(text)
25

26

27
def is_exec_seg(seg):
    """Return True if ``seg`` is a segment with the execute permission bit set.

    ``None`` is accepted and yields False.
    """
    if seg is not None:
        return (seg.perm & ida_segment.SEGPERM_EXEC) != 0
    return False
31

32

33
def iter_exec_heads():
    """Yield the address of every code head in every executable segment."""
    for seg_start in idautils.Segments():
        segment = ida_segment.getseg(seg_start)
        if not is_exec_seg(segment):
            continue
        head = segment.start_ea
        while head < segment.end_ea:
            if ida_bytes.is_code(ida_bytes.get_flags(head)):
                yield head
            # Advance to the next defined item within the segment.
            head = idc.next_head(head, segment.end_ea)
44

45

46
def op_text(ea, n):
    """Return operand ``n`` of the instruction at ``ea`` as stripped text.

    Returns an empty string when IDA reports no text for that operand.
    """
    raw = idc.print_operand(ea, n)
    if not raw:
        return ""
    return raw.strip()
49

50

51
def mnem(ea):
    """Return the lower-cased mnemonic of the instruction at ``ea``."""
    mnemonic = idc.print_insn_mnem(ea)
    return mnemonic.lower()
53

54

55
def normalize_reg(text):
    """Canonicalise a register name: lower-case, surrounding whitespace removed."""
    lowered = text.lower()
    return lowered.strip()
57

58

59
def is_x8_reg(text):
    """Return True if ``text`` names X8 or its 32-bit view W8 (case-insensitive)."""
    name = text.lower().strip()
    return name == "x8" or name == "w8"
62

63

64
def parse_imm_and_shift(text):
    """Parse an immediate operand with an optional ``LSL`` shift.

    Accepted forms (case-insensitive, spaces ignored)::

        #0x81
        #0xb6a2,LSL#16
        #123

    Returns:
        ``(imm, shift_bits)``, or ``None`` if the text is not in that form.
    """
    compact = text.lower().replace(" ", "")
    found = re.match(r"#(?P<imm>-?(?:0x[0-9a-f]+|\d+))(?:,lsl#(?P<shift>\d+))?$", compact)
    if found is None:
        return None
    shift_text = found.group("shift")
    shift_bits = int(shift_text) if shift_text else 0
    # Base 0 lets int() accept both the decimal and the 0x-prefixed form.
    return int(found.group("imm"), 0), shift_bits
79

80

81
def writes_x8(ea):
    """Return True if the instruction at ``ea`` has X8/W8 as its destination.

    Operand 0 is the destination for data-processing and load instructions,
    but for stores, compares and branches it is only read. Those are excluded
    so that e.g. ``STR X8, [SP]`` between the ``MOV X8, #nr`` and the ``SVC``
    does not stop the backward search for the syscall number.
    """
    if not is_x8_reg(op_text(ea, 0)):
        return False
    reads_operand0_only = (
        "str", "strb", "strh", "stur", "sturb", "sturh",
        "stp", "stnp", "stlr", "stlrb", "stlrh",
        "cmp", "cmn", "tst", "ccmp", "ccmn",
        "cbz", "cbnz", "tbz", "tbnz",
        "br", "blr", "ret",
    )
    return mnem(ea) not in reads_operand0_only
83

84

85
def decode_syscall_from_backtrack(svc_ea, limit=BACKTRACK_LIMIT):
    """Heuristically reconstruct the value of X8 at an ``SVC`` instruction.

    Walks backwards linearly (control flow is ignored) from ``svc_ea`` for at
    most ``limit`` instructions inside the containing function, looking at
    instructions that write X8/W8.

    Supported forms:
      MOV   X8, #imm
      MOVZ  X8, #imm[, LSL#n]
      MOVK  X8, #imm[, LSL#n]   (collected until the MOV/MOVZ is found)
      ORR   X8, XZR, #imm       (also the W8/WZR spelling)

    Any other write to X8 ends the search as unresolved.

    Returns:
      {
        "sysno": int or None,
        "writer_eas": [ea...],  # instructions contributing to x8, nearest first
      }
    """
    func = ida_funcs.get_func(svc_ea)
    if not func:
        return {"sysno": None, "writer_eas": []}

    writer_eas = []
    movk_parts = []  # (shift, imm) in scan order, i.e. nearest to the SVC first

    def unresolved():
        return {"sysno": None, "writer_eas": writer_eas}

    cur = idc.prev_head(svc_ea, func.start_ea)
    for _ in range(limit):
        if cur == idc.BADADDR or cur < func.start_ea:
            break

        insn_mnem = mnem(cur)
        if writes_x8(cur):
            writer_eas.append(cur)

            if insn_mnem == "movk":
                parsed = parse_imm_and_shift(op_text(cur, 1))
                if parsed is None:
                    return unresolved()
                imm, shift = parsed
                movk_parts.append((shift, imm))
            elif insn_mnem in ("mov", "movz"):
                parsed = parse_imm_and_shift(op_text(cur, 1))
                if parsed is None:
                    return unresolved()
                imm, shift = parsed
                value = imm << shift
                # Replay the MOVKs in program order (farthest from the SVC
                # first) so that, if two of them target the same 16-bit lane,
                # the one executed last wins, as it does on the CPU.
                for part_shift, part_imm in reversed(movk_parts):
                    mask = 0xFFFF << part_shift
                    value = (value & ~mask) | ((part_imm & 0xFFFF) << part_shift)
                return {"sysno": value, "writer_eas": writer_eas}
            elif insn_mnem == "orr":
                src1 = normalize_reg(op_text(cur, 1))
                parsed = parse_imm_and_shift(op_text(cur, 2))
                # ORR with the zero register is a plain immediate load.
                if src1 in ("xzr", "wzr") and parsed is not None:
                    imm, shift = parsed
                    return {"sysno": imm << shift, "writer_eas": writer_eas}
                return unresolved()
            else:
                return unresolved()

        cur = idc.prev_head(cur, func.start_ea)

    return unresolved()
151

152

153
def nearby_insns(ea, before=10, after=2):
    """Collect (address, disassembly) pairs for the heads surrounding ``ea``.

    Walks back at most ``before`` heads from ``ea`` (bounded by the start of
    the segment containing ``ea``), then lists heads forward from there until
    ``after`` heads past ``ea`` have been emitted or the segment ends.

    Args:
        ea: address the listing is centred on.
        before: maximum number of heads to show ahead of ``ea``.
        after: maximum number of heads to show following ``ea``.

    Returns:
        A list of ``(address, disassembly_text)`` tuples in ascending
        address order.
    """
    seg_start = idc.get_segm_start(ea)
    seg_end = idc.get_segm_end(ea)

    # Step backwards, but keep the last valid head: letting the cursor become
    # BADADDR would make the forward pass below emit nothing for addresses
    # that sit close to the beginning of their segment.
    start = ea
    stepped_back = 0
    for _ in range(before):
        prev = idc.prev_head(start, seg_start)
        if prev == idc.BADADDR:
            break
        start = prev
        stepped_back += 1

    items = []
    cur = start
    # Size the window from the number of steps actually taken so that the
    # `after` limit is respected even when the back-walk was cut short.
    remaining = stepped_back + after + 1
    while cur != idc.BADADDR and remaining > 0:
        items.append((cur, idc.GetDisasm(cur)))
        nxt = idc.next_head(cur, seg_end)
        if nxt == idc.BADADDR or nxt == cur:
            break
        cur = nxt
        remaining -= 1
    return items
169

170

171
def make_patch_lines(matches):
    """Render the Frida JavaScript snippet that patches every matched svc site.

    The output starts with a fixed ``patchArm64MovX0Zero`` helper definition,
    followed by one comment line and one helper call per entry in ``matches``.

    Args:
        matches: iterable of dicts providing ``sys_name`` (str), ``sysno``
            (int) and ``svc_ea`` (int) for each site.

    Returns:
        The snippet as a single newline-joined string.
    """
    out = [
        "// auto-generated by search_kill.py",
        "function patchArm64MovX0Zero(addr, tag) {",
        "    Memory.patchCode(addr, 4, function (code) {",
        "        var writer = new Arm64Writer(code, { pc: addr });",
        '        writer.putMovRegReg("x0", "xzr");',
        "        writer.flush();",
        "    });",
        '    console.log("[+] patched " + tag + " @ " + addr + " (mov x0, xzr)");',
        "}",
        "",
    ]

    for number, hit in enumerate(matches, 1):
        name = hit["sys_name"]
        sysno = hit["sysno"]
        site = hit["svc_ea"]
        # The tag is what the generated script prints after patching a site.
        label = "%s syscall(%d) #%d @ 0x%x" % (name, sysno, number, site)
        out.append("// %s (%d)" % (name, sysno))
        out.append('patchArm64MovX0Zero(inner_base.add(0x%x), "%s");' % (site, label))

    return "\n".join(out)
193

194

195
def write_snippet_file(text):
    """Save ``text`` as ``PATCH_FILE_NAME`` next to the current IDB.

    Falls back to the current working directory when the IDB path has no
    directory component.

    Returns:
        The path written to, or ``None`` if writing failed (the failure is
        reported through ``log``).
    """
    base_dir = os.path.dirname(idc.get_idb_path())
    if not base_dir:
        base_dir = os.getcwd()
    target = os.path.join(base_dir, PATCH_FILE_NAME)

    try:
        with open(target, "w", encoding="utf-8") as handle:
            handle.write(text)
    except Exception as err:
        log("[!] failed to write snippet file: %s" % err)
        return None
    return target
205

206

207
def main():
    """Find svc sites whose decoded syscall number is targeted, and report them.

    For every head yielded by ``iter_exec_heads`` whose mnemonic is ``svc``,
    the syscall number is recovered with ``decode_syscall_from_backtrack``.
    Sites whose number is a key of ``TARGET_SYSCALLS`` are logged in detail,
    and a Frida patch snippet covering all of them is logged and written to
    disk.
    """
    hits = []

    for svc_ea in iter_exec_heads():
        if mnem(svc_ea) != "svc":
            continue

        decoded = decode_syscall_from_backtrack(svc_ea)
        sysno = decoded["sysno"]
        if sysno not in TARGET_SYSCALLS:
            continue

        owner = ida_funcs.get_func(svc_ea)
        if owner:
            owner_name = idc.get_func_name(svc_ea)
            owner_start = owner.start_ea
        else:
            owner_name = "<no_func>"
            owner_start = idc.BADADDR

        hits.append({
            "svc_ea": svc_ea,
            "func_start": owner_start,
            "func_name": owner_name,
            # Writers are collected while scanning backwards; flip them so
            # they are listed in ascending address order.
            "writer_eas": decoded["writer_eas"][::-1],
            "sysno": sysno,
            "sys_name": TARGET_SYSCALLS[sysno],
            "nearby": nearby_insns(svc_ea),
        })

    if not hits:
        msg = "[*] no target termination syscall svc sites found"
        log(msg)
        ida_kernwin.info(msg)
        return

    # Group by syscall number first, then by address.
    hits.sort(key=lambda hit: (hit["sysno"], hit["svc_ea"]))

    separator = "=" * 72
    log("[*] found %d target termination syscall site(s)" % len(hits))
    log("")

    for number, hit in enumerate(hits, 1):
        log(separator)
        log("[%d] svc @ 0x%x  func=%s @ 0x%x  %s (sysno=%d / 0x%x)" % (
            number,
            hit["svc_ea"],
            hit["func_name"],
            hit["func_start"],
            hit["sys_name"],
            hit["sysno"],
            hit["sysno"],
        ))

        writers = hit["writer_eas"]
        if not writers:
            log("    x8 writers: <unresolved>")
        else:
            log("    x8 writers:")
            for writer_ea in writers:
                log("      0x%x  %s" % (writer_ea, idc.GetDisasm(writer_ea)))

        log("    nearby:")
        for insn_ea, disasm in hit["nearby"]:
            # Flag the svc instruction itself within the context listing.
            marker = ">>" if insn_ea == hit["svc_ea"] else "  "
            log("    %s 0x%x  %s" % (marker, insn_ea, disasm))
        log("")

    snippet = make_patch_lines(hits)
    saved_to = write_snippet_file(snippet)

    log(separator)
    log("[*] bypass.js snippet:")
    log(snippet)
    log("")
    if saved_to:
        log("[*] snippet saved to: %s" % saved_to)

    ida_kernwin.info("search_kill.py finished, found %d target termination svc site(s)" % len(hits))


if __name__ == "__main__":
    main()

加上我们之前对 sub_1304C的处理，就可以完美绕过啦~

完整代码如下：

1
// Script-wide state shared by the hooks and applyPatches().
var target_so = "libDexHelper.so",  // substring matched against the android_dlopen_ext path
    inner_base = null,              // return value of the mmap call with the expected length
    found = false,                  // set once that mmap call has been seen
    patched = false,                // set once applyPatches() has completed
    callbacks = [],                 // holds NativeCallback objects (presumably to keep them alive)
    mmap_listener = null,           // Interceptor listener for mmap, kept so it can be detached
    dlopen_listener = null;         // Interceptor listener for android_dlopen_ext, kept so it can be detached
7
var dlopen_listener = null;
8

9
/**
 * Overwrite the 4-byte instruction at `addr` with `mov x0, xzr` and log it.
 *
 * @param {NativePointer} addr - address of the instruction to replace.
 * @param {string} tag - label printed in the log line for this patch.
 */
function patchArm64MovX0Zero(addr, tag) {
    var emitMovZero = function (code) {
        var asm = new Arm64Writer(code, { pc: addr });
        asm.putMovRegReg("x0", "xzr");
        asm.flush();
    };

    Memory.patchCode(addr, 4, emitMovZero);
    console.log("[+] patched " + tag + " @ " + addr + " (mov x0, xzr)");
}
17

18
/**
 * Apply all patches relative to `inner_base`, at most once.
 *
 * Replaces the function at offset 0x1304c with a stub returning 0, then
 * overwrites every listed svc site with `mov x0, xzr`. Does nothing when the
 * patches were already applied or `inner_base` has not been captured yet.
 */
function applyPatches() {
    if (patched || inner_base == null) {
        return;
    }

    var sub1304c = inner_base.add(0x1304c);
    var stub = new NativeCallback(function () {
        return 0;
    }, "int", []);

    // Keep a reference to the callback in script-wide state.
    callbacks.push(stub);
    Interceptor.replace(sub1304c, stub);
    console.log("[+] patched sub_1304C @ " + sub1304c);

    // Offsets of the `svc` instructions resolved to kill (syscall 129).
    // A precise patch only needs two of them: 0x190a0 and 0x19420.
    var killSites = [
        0x17558, 0x17614, 0x176ec, 0x17a7c, 0x17af0,
        0x190a0, 0x1925c, 0x19420, 0x25fb0, 0x4f3a0,
        0x4f5d4, 0x4febc, 0x55368, 0x56588
    ];

    for (var i = 0; i < killSites.length; i++) {
        var offset = killSites[i];
        var tag = "kill syscall(129) #" + (i + 1) + " @ 0x" + offset.toString(16);
        patchArm64MovX0Zero(inner_base.add(offset), tag);
    }

    patched = true;
}
65

66
// Watch libc's mmap for the call whose length is 0x134000; its return value
// is recorded as inner_base, after which this hook removes itself.
mmap_listener = Interceptor.attach(Module.findExportByName("libc.so", "mmap"), {
    onEnter: function (args) {
        // Second mmap argument: requested length.
        this.len = args[1].toUInt32();
    },
    onLeave: function (retval) {
        if (found || retval.isNull() || this.len !== 0x134000) {
            return;
        }

        found = true;
        // Build a fresh pointer from the string form instead of storing retval itself.
        inner_base = ptr(retval.toString());
        console.log("[+] inner base = " + inner_base);

        if (!mmap_listener) {
            return;
        }
        mmap_listener.detach();
        mmap_listener = null;
        console.log("[+] mmap hook detached");
    }
});
85

86
// Once android_dlopen_ext returns for a path containing target_so and
// inner_base is known, apply the patches and remove this hook.
dlopen_listener = Interceptor.attach(Module.findExportByName(null, "android_dlopen_ext"), {
    onEnter: function (args) {
        var pathArg = args[0];
        this.fileName = pathArg.isNull() ? "" : pathArg.readCString();
    },
    onLeave: function (retval) {
        if (patched) {
            return;
        }

        var name = this.fileName;
        var isTarget = name && name.indexOf(target_so) >= 0 && inner_base != null;
        if (!isTarget) {
            return;
        }

        applyPatches();

        if (dlopen_listener) {
            dlopen_listener.detach();
            dlopen_listener = null;
            console.log("[+] dlopen hook detached");
        }
    }
});

0x03 小结#

很早以前就对壳感兴趣，但是一直没有时间研究。这次特意选了安卓端最简单的壳进行分析。之前不懂为什么那么多国家相关的APP，以及一些大银行，都喜欢用这家的壳，明明比它强的壳还有很多。最近和朋友聊天时问了这个问题，他跟我说，很多东西不是技术层面的问题，而是法律层面的。这下算是恍然大悟了

这篇篇幅还是有点太短了，剩下的dex解密流程分析过两天回学校有空了再写吧ovo

使用到的一些工具以及文章：

stalker_trace_so