1 /* Capstone Disassembler Engine */
2 /* By Nguyen Anh Quynh <aquynh@gmail.com>, 2013> */
3 
4 #include <stdio.h>
5 #include <stdlib.h>
6 
7 #include <platform.h>
8 #include <capstone.h>
9 
10 struct platform {
11 	cs_arch arch;
12 	cs_mode mode;
13 	unsigned char *code;
14 	size_t size;
15 	char *comment;
16 	cs_opt_type opt_type;
17 	cs_opt_value opt_value;
18 };
19 
print_string_hex(unsigned char * str,size_t len)20 static void print_string_hex(unsigned char *str, size_t len)
21 {
22 	unsigned char *c;
23 
24 	printf("Code: ");
25 	for (c = str; c < str + len; c++) {
26 		printf("0x%02x ", *c & 0xff);
27 	}
28 	printf("\n");
29 }
30 
test()31 static void test()
32 {
33 #define X86_CODE16 "\x8d\x4c\x32\x08\x01\xd8\x81\xc6\x34\x12\x00\x00"
34 #define X86_CODE32 "\x8d\x4c\x32\x08\x01\xd8\x81\xc6\x34\x12\x00\x00"
35 //#define X86_CODE32 "\x0f\xa7\xc0"	// xstorerng
36 #define X86_CODE64 "\x55\x48\x8b\x05\xb8\x13\x00\x00"
37 //#define ARM_CODE "\x04\xe0\x2d\xe5"
38 #define ARM_CODE "\xED\xFF\xFF\xEB\x04\xe0\x2d\xe5\x00\x00\x00\x00\xe0\x83\x22\xe5\xf1\x02\x03\x0e\x00\x00\xa0\xe3\x02\x30\xc1\xe7\x00\x00\x53\xe3"
39 #define ARM_CODE2 "\x10\xf1\x10\xe7\x11\xf2\x31\xe7\xdc\xa1\x2e\xf3\xe8\x4e\x62\xf3"
40 #define ARMV8 "\xe0\x3b\xb2\xee\x42\x00\x01\xe1\x51\xf0\x7f\xf5"
41 #define THUMB_MCLASS "\xef\xf3\x02\x80"
42 #define THUMB_CODE "\x70\x47\xeb\x46\x83\xb0\xc9\x68"
43 #define THUMB_CODE2 "\x4f\xf0\x00\x01\xbd\xe8\x00\x88\xd1\xe8\x00\xf0"
44 #define MIPS_CODE "\x0C\x10\x00\x97\x00\x00\x00\x00\x24\x02\x00\x0c\x8f\xa2\x00\x00\x34\x21\x34\x56"
45 #define MIPS_CODE2 "\x56\x34\x21\x34\xc2\x17\x01\x00"
46 #define MIPS_32R6M "\x00\x07\x00\x07\x00\x11\x93\x7c\x01\x8c\x8b\x7c\x00\xc7\x48\xd0"
47 #define MIPS_32R6 "\xec\x80\x00\x19\x7c\x43\x22\xa0"
48 //#define ARM64_CODE "\x00\x40\x21\x4b"	// 	sub		w0, w0, w1, uxtw
49 //#define ARM64_CODE "\x21\x7c\x02\x9b"	// mul	x1, x1, x2
50 //#define ARM64_CODE "\x20\x74\x0b\xd5"	// dc	zva, x0
51 //#define ARM64_CODE "\xe1\x0b\x40\xb9"	// ldr		w1, [sp, #0x8]
52 #define ARM64_CODE "\x21\x7c\x02\x9b\x21\x7c\x00\x53\x00\x40\x21\x4b\xe1\x0b\x40\xb9"
53 #define PPC_CODE "\x80\x20\x00\x00\x80\x3f\x00\x00\x10\x43\x23\x0e\xd0\x44\x00\x80\x4c\x43\x22\x02\x2d\x03\x00\x80\x7c\x43\x20\x14\x7c\x43\x20\x93\x4f\x20\x00\x21\x4c\xc8\x00\x21"
54 #define SPARC_CODE "\x80\xa0\x40\x02\x85\xc2\x60\x08\x85\xe8\x20\x01\x81\xe8\x00\x00\x90\x10\x20\x01\xd5\xf6\x10\x16\x21\x00\x00\x0a\x86\x00\x40\x02\x01\x00\x00\x00\x12\xbf\xff\xff\x10\xbf\xff\xff\xa0\x02\x00\x09\x0d\xbf\xff\xff\xd4\x20\x60\x00\xd4\x4e\x00\x16\x2a\xc2\x80\x03"
55 #define SPARCV9_CODE "\x81\xa8\x0a\x24\x89\xa0\x10\x20\x89\xa0\x1a\x60\x89\xa0\x00\xe0"
56 #define SYSZ_CODE "\xed\x00\x00\x00\x00\x1a\x5a\x0f\x1f\xff\xc2\x09\x80\x00\x00\x00\x07\xf7\xeb\x2a\xff\xff\x7f\x57\xe3\x01\xff\xff\x7f\x57\xeb\x00\xf0\x00\x00\x24\xb2\x4f\x00\x78"
57 #define XCORE_CODE "\xfe\x0f\xfe\x17\x13\x17\xc6\xfe\xec\x17\x97\xf8\xec\x4f\x1f\xfd\xec\x37\x07\xf2\x45\x5b\xf9\xfa\x02\x06\x1b\x10"
58 	struct platform {
59 		cs_arch arch;
60 		cs_mode mode;
61 		unsigned char *code;
62 		size_t size;
63 		char *comment;
64 		cs_opt_type opt_type;
65 		cs_opt_value opt_value;
66 	};
67 	struct platform platforms[] = {
68 		{
69 			CS_ARCH_X86,
70 			CS_MODE_16,
71 			(unsigned char*)X86_CODE16,
72 			sizeof(X86_CODE16) - 1,
73 			"X86 16bit (Intel syntax)"
74 		},
75 		{
76 			CS_ARCH_X86,
77 			CS_MODE_32,
78 			(unsigned char*)X86_CODE32,
79 			sizeof(X86_CODE32) - 1,
80 			"X86 32bit (ATT syntax)",
81 			CS_OPT_SYNTAX,
82 			CS_OPT_SYNTAX_ATT,
83 		},
84 		{
85 			CS_ARCH_X86,
86 			CS_MODE_32,
87 			(unsigned char*)X86_CODE32,
88 			sizeof(X86_CODE32) - 1,
89 			"X86 32 (Intel syntax)"
90 		},
91 		{
92 			CS_ARCH_X86,
93 			CS_MODE_64,
94 			(unsigned char*)X86_CODE64,
95 			sizeof(X86_CODE64) - 1,
96 			"X86 64 (Intel syntax)"
97 		},
98 		{
99 			CS_ARCH_ARM,
100 			CS_MODE_ARM,
101 			(unsigned char*)ARM_CODE,
102 			sizeof(ARM_CODE) - 1,
103 			"ARM"
104 		},
105 		{
106 			CS_ARCH_ARM,
107 			CS_MODE_THUMB,
108 			(unsigned char*)THUMB_CODE2,
109 			sizeof(THUMB_CODE2) - 1,
110 			"THUMB-2"
111 		},
112 		{
113 			CS_ARCH_ARM,
114 			CS_MODE_ARM,
115 			(unsigned char*)ARM_CODE2,
116 			sizeof(ARM_CODE2) - 1,
117 			"ARM: Cortex-A15 + NEON"
118 		},
119 		{
120 			CS_ARCH_ARM,
121 			CS_MODE_THUMB,
122 			(unsigned char*)THUMB_CODE,
123 			sizeof(THUMB_CODE) - 1,
124 			"THUMB"
125 		},
126 		{
127 			CS_ARCH_ARM,
128 			(cs_mode)(CS_MODE_THUMB + CS_MODE_MCLASS),
129 			(unsigned char*)THUMB_MCLASS,
130 			sizeof(THUMB_MCLASS) - 1,
131 			"Thumb-MClass"
132 		},
133 		{
134 			CS_ARCH_ARM,
135 			(cs_mode)(CS_MODE_ARM + CS_MODE_V8),
136 			(unsigned char*)ARMV8,
137 			sizeof(ARMV8) - 1,
138 			"Arm-V8"
139 		},
140 		{
141 			CS_ARCH_MIPS,
142 			(cs_mode)(CS_MODE_MIPS32 + CS_MODE_BIG_ENDIAN),
143 			(unsigned char*)MIPS_CODE,
144 			sizeof(MIPS_CODE) - 1,
145 			"MIPS-32 (Big-endian)"
146 		},
147 		{
148 			CS_ARCH_MIPS,
149 			(cs_mode)(CS_MODE_MIPS64 + CS_MODE_LITTLE_ENDIAN),
150 			(unsigned char*)MIPS_CODE2,
151 			sizeof(MIPS_CODE2) - 1,
152 			"MIPS-64-EL (Little-endian)"
153 		},
154 		{
155 			CS_ARCH_MIPS,
156 			(cs_mode)(CS_MODE_MIPS32R6 + CS_MODE_MICRO + CS_MODE_BIG_ENDIAN),
157 			(unsigned char*)MIPS_32R6M,
158 			sizeof(MIPS_32R6M) - 1,
159 			"MIPS-32R6 | Micro (Big-endian)"
160 		},
161 		{
162 			CS_ARCH_MIPS,
163 			(cs_mode)(CS_MODE_MIPS32R6 + CS_MODE_BIG_ENDIAN),
164 			(unsigned char*)MIPS_32R6,
165 			sizeof(MIPS_32R6) - 1,
166 			"MIPS-32R6 (Big-endian)"
167 		},
168 		{
169 			CS_ARCH_ARM64,
170 			CS_MODE_ARM,
171 			(unsigned char*)ARM64_CODE,
172 			sizeof(ARM64_CODE) - 1,
173 			"ARM-64"
174 		},
175 		{
176 			CS_ARCH_PPC,
177 			CS_MODE_BIG_ENDIAN,
178 			(unsigned char*)PPC_CODE,
179 			sizeof(PPC_CODE) - 1,
180 			"PPC-64"
181 		},
182 		{
183 			CS_ARCH_PPC,
184 			CS_MODE_BIG_ENDIAN,
185 			(unsigned char*)PPC_CODE,
186 			sizeof(PPC_CODE) - 1,
187 			"PPC-64, print register with number only",
188 			CS_OPT_SYNTAX,
189 			CS_OPT_SYNTAX_NOREGNAME
190 		},
191 		{
192 			CS_ARCH_SPARC,
193 			CS_MODE_BIG_ENDIAN,
194 			(unsigned char*)SPARC_CODE,
195 			sizeof(SPARC_CODE) - 1,
196 			"Sparc"
197 		},
198 		{
199 			CS_ARCH_SPARC,
200 			(cs_mode)(CS_MODE_BIG_ENDIAN + CS_MODE_V9),
201 			(unsigned char*)SPARCV9_CODE,
202 			sizeof(SPARCV9_CODE) - 1,
203 			"SparcV9"
204 		},
205 		{
206 			CS_ARCH_SYSZ,
207 			(cs_mode)0,
208 			(unsigned char*)SYSZ_CODE,
209 			sizeof(SYSZ_CODE) - 1,
210 			"SystemZ"
211 		},
212 		{
213 			CS_ARCH_XCORE,
214 			(cs_mode)0,
215 			(unsigned char*)XCORE_CODE,
216 			sizeof(XCORE_CODE) - 1,
217 			"XCore"
218 		},
219 	};
220 
221 	csh handle;
222 	uint64_t address = 0x1000;
223 	cs_insn *insn;
224 	int i;
225 	size_t count;
226 	cs_err err;
227 
228 	for (i = 0; i < sizeof(platforms)/sizeof(platforms[0]); i++) {
229 		printf("****************\n");
230 		printf("Platform: %s\n", platforms[i].comment);
231 		err = cs_open(platforms[i].arch, platforms[i].mode, &handle);
232 		if (err) {
233 			printf("Failed on cs_open() with error returned: %u\n", err);
234 			continue;
235 		}
236 
237 		if (platforms[i].opt_type)
238 			cs_option(handle, platforms[i].opt_type, platforms[i].opt_value);
239 
240 		count = cs_disasm(handle, platforms[i].code, platforms[i].size, address, 0, &insn);
241 		if (count) {
242 			size_t j;
243 
244 			print_string_hex(platforms[i].code, platforms[i].size);
245 			printf("Disasm:\n");
246 
247 			for (j = 0; j < count; j++) {
248 				printf("0x%" PRIx64 ":\t%s\t\t%s\n",
249 						insn[j].address, insn[j].mnemonic, insn[j].op_str);
250 			}
251 
252 			// print out the next offset, after the last insn
253 			printf("0x%" PRIx64 ":\n", insn[j-1].address + insn[j-1].size);
254 
255 			// free memory allocated by cs_disasm()
256 			cs_free(insn, count);
257 		} else {
258 			printf("****************\n");
259 			printf("Platform: %s\n", platforms[i].comment);
260 			print_string_hex(platforms[i].code, platforms[i].size);
261 			printf("ERROR: Failed to disasm given code!\n");
262 		}
263 
264 		printf("\n");
265 
266 		cs_close(&handle);
267 	}
268 }
269 
main()270 int main()
271 {
272 	test();
273 
274 #if 0
275 #define offsetof(st, m) __builtin_offsetof(st, m)
276 
277 	cs_insn insn;
278 	printf("size: %lu\n", sizeof(insn));
279 	printf("@id: %lu\n", offsetof(cs_insn, id));
280 	printf("@address: %lu\n", offsetof(cs_insn, address));
281 	printf("@size: %lu\n", offsetof(cs_insn, size));
282 	printf("@bytes: %lu\n", offsetof(cs_insn, bytes));
283 	printf("@mnemonic: %lu\n", offsetof(cs_insn, mnemonic));
284 	printf("@op_str: %lu\n", offsetof(cs_insn, op_str));
285 	printf("@regs_read: %lu\n", offsetof(cs_insn, regs_read));
286 	printf("@regs_read_count: %lu\n", offsetof(cs_insn, regs_read_count));
287 	printf("@regs_write: %lu\n", offsetof(cs_insn, regs_write));
288 	printf("@regs_write_count: %lu\n", offsetof(cs_insn, regs_write_count));
289 	printf("@groups: %lu\n", offsetof(cs_insn, groups));
290 	printf("@groups_count: %lu\n", offsetof(cs_insn, groups_count));
291 	printf("@arch: %lu\n", offsetof(cs_insn, x86));
292 #endif
293 
294 	return 0;
295 }
296