-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathgcdsp.py
413 lines (344 loc) · 11.8 KB
/
gcdsp.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
"""
gcdsp.py
~~~~~~~~
An IDAPython processor module for the GC/Wii DSP.
Copyright (C) 2011 Pierre Bourdon <delroth@dolphin-emu.org>
Licensed under the GPLv2 license, see the LICENSE file at the root of this
repository.
"""
from idaapi import *
import os.path
# Single-line banner printed by the processor module once a binary is loaded.
GREETINGS_STRING = (
    "GC/Wii DSP processor for IDA (C) 2011 delroth@dolphin-emu.org - "
    "licensed under the GPLv2 license"
)
class OpType:
    """Operand encoding kinds found in the GC DSP ISA.

    The values come from DSPTables.h in the Dolphin source code.
    """

    # Non-register operand kinds.
    NONE = 0
    VAL = 1
    IMM = 2
    MEM = 3
    STR = 4
    ADDR_I = 5
    ADDR_D = 6

    # Bit flagging a register operand, and the mask of the bits that
    # Operand.parse() shifts down by 8 and folds into the register number.
    REG = 0x8000
    REGS_MASK = 0x3f80

    # Register operand kinds: REG combined with a per-kind bit pattern.
    REG04 = REG | 0x0400
    REG08 = REG | 0x0800
    REG18 = REG | 0x1800
    REG19 = REG | 0x1900
    REG1A = REG | 0x1a80
    REG1C = REG | 0x1c00
    ACCM = REG | 0x1e00
    ACCM_D = REG | 0x1e80
    ACC = REG | 0x2000
    ACC_D = REG | 0x2080
    AX = REG | 0x2200

    # Alternate names sharing the value of another kind.
    REGM18 = REG18
    REGM19 = REG19
    ACCL = REG1C

    # Register reference kinds (mapped to an IDA phrase by Operand.parse()).
    REF = REG | 0x4000
    PRG = REF | REG
# Get autogenerated parts (the `opcodes` and `opcodes_ext` tables used when
# building the instruction list) from another file located next to this one.
# execfile() only exists on Python 2, so the source is read, compiled and
# executed explicitly; this form runs in the module namespace on both
# Python 2 and Python 3.
_generated_path = os.path.join(os.path.dirname(__file__), 'gcdsp_generated.py')
with open(_generated_path) as _generated_file:
    exec(compile(_generated_file.read(), _generated_path, 'exec'))
class Operand(object):
    """Decoder for one operand slot of an instruction.

    Constructor arguments are stored unchanged on the instance:
      type   -- OpType value describing how the operand is encoded
      size   -- only compared against 2 by parse(), for MEM operands
      loc    -- falsy: operand lives in the first word; truthy: second word
      rshift -- right shift applied after masking (negative: left shift)
      mask   -- bit mask applied to the selected word
    """

    def __init__(self, type, size, loc, rshift, mask):
        self.type, self.size, self.loc = type, size, loc
        self.rshift, self.mask = rshift, mask

    def parse(self, res, byte1, byte2):
        """Decode this operand from the two instruction words into `res`.

        Code mostly from the Dolphin version of DSPTool's disassemble.cpp
        file, translated into Python.

        `res` is an IDA op_t; its `type`, `dtyp` and one of `reg`, `phrase`,
        `addr` or `value` are filled in. Raises ValueError when the operand
        kind is not one of REG, PRG, ADDR_I, ADDR_D, IMM or MEM.
        """
        # Select the word holding the operand, then isolate and align it.
        word = byte2 if self.loc else byte1
        val = word & self.mask
        if self.rshift >= 0:
            val >>= self.rshift
        else:
            val <<= -self.rshift

        kind = self.type
        if kind & OpType.REG:
            # Register operands carry a base register number in REGS_MASK.
            bank = (kind & OpType.REGS_MASK) >> 8
            if kind == OpType.ACC_D or kind == OpType.ACCM_D:
                # The *_D kinds use the inverted low bit of the field.
                val = (~val & 0x1) | bank
            else:
                val |= bank
            kind &= ~OpType.REGS_MASK

        # Operand kind -> (IDA operand type, op_t field receiving the value).
        layout = {
            OpType.REG: (o_reg, "reg"),
            OpType.PRG: (o_phrase, "phrase"),
            OpType.ADDR_I: (o_near, "addr"),
            OpType.ADDR_D: (o_mem, "addr"),
            OpType.IMM: (o_imm, "value"),
            OpType.MEM: (o_mem, "addr"),
        }
        if kind not in layout:
            raise ValueError("unhandled type: %04X" % kind)

        if kind == OpType.MEM and self.size != 2 and val & 0x80:
            # Extend bit 7 into the upper byte of the 16-bit address.
            val |= 0xFF00

        ida_type, field = layout[kind]
        res.type = ida_type
        res.dtyp = dt_byte  # TODO: fix (ACCs are 40-bit for example)
        setattr(res, field, val)
class Instr(object):
    """Description of one instruction (optionally with an extension part).

    Attributes set by the constructor:
      name, opcode, mask, size -- stored as given
      operands       -- operand descriptions of the main instruction
      ext_operands   -- operand descriptions of the extension part
      all_operands   -- operands followed by ext_operands
      all_ops_parsed -- one Operand built from each entry of all_operands
      stops, calls, jumps, shifts, hll -- booleans turned into IDA feature
                                          bits by the `flags` property
    """

    def __init__(self, name, opcode, mask, size, operands=None,
                 ext_operands=None, stops=False, calls=False, jumps=False,
                 shifts=False, hll=False):
        """Store the instruction description.

        `operands` and `ext_operands` are sequences of argument tuples for
        Operand(); each defaults to an empty list. They are copied so that
        instances never share a list with each other or with the caller.
        """
        self.name = name
        # A mutable default argument would be one list object shared by
        # every instance created without operands; build fresh lists.
        self.operands = [] if operands is None else list(operands)
        self.ext_operands = [] if ext_operands is None else list(ext_operands)
        self.all_operands = self.operands + self.ext_operands
        self.all_ops_parsed = [Operand(*o) for o in self.all_operands]

        self.stops = stops
        self.calls = calls
        self.jumps = jumps
        self.shifts = shifts
        self.hll = hll

        self.opcode = opcode
        self.mask = mask
        self.size = size

    def __str__(self):
        return "<Instr: %s (%04X & %04X)>" % (self.name, self.opcode,
                                              self.mask)

    @property
    def flags(self):
        """Return the IDA feature bits (CF_*) describing this instruction."""
        ret = 0
        # Mark every operand slot as used: CF_USE1 shifted by the index.
        for i in range(len(self.all_operands)):
            ret |= CF_USE1 << i  # TODO: CF_CHG ?
        if self.stops:
            ret |= CF_STOP
        if self.calls:
            ret |= CF_CALL
        if self.jumps:
            ret |= CF_JUMP
        if self.shifts:
            ret |= CF_SHFT
        if self.hll:
            ret |= CF_HLL
        return ret
class GCDSPProcessor(processor_t):
    """IDA processor module class for the GC/Wii DSP.

    Builds the instruction tables from the module-level `opcodes` and
    `opcodes_ext` tables and implements the analysis (`ana`), emulation
    (`emu`) and text output (`out`, `outop`) callbacks.
    """

    # Processor description attributes.
    id = 0x8000 + 5854
    flag = PR_ADJSEGS | PRN_HEX | PR_WORD_INS
    cnbits = 16
    dnbits = 16
    psnames = ["gcdsp"]
    plnames = ["GC/Wii DSP"]
    segreg_size = 0
    instruc_start = 0

    # Assembler description used for the generated listing.
    assembler = {
        "flag": (ASH_HEXF3 | ASD_DECF0 | ASO_OCTF1 | ASB_BINF3 | AS_NOTAB
                 | AS_ASCIIC | AS_ASCIIZ),
        "uflag": 0,
        "name": "GNU assembler",

        "origin": ".org",
        "end": "end",
        "cmnt": ";",

        "ascsep": '"',
        "accsep": "'",
        "esccodes": "\"'",

        "a_ascii": ".ascii",
        "a_byte": ".word",
        "a_word": ".dword",

        "a_bss": "dfs %s",

        "a_seg": "seg",
        "a_curip": ".",
        "a_public": "",
        "a_weak": "",
        "a_extrn": ".extrn",
        "a_comdef": "",
        "a_align": ".align",

        "lbrace": "(",
        "rbrace": ")",
        "a_mod": "%",
        "a_band": "&",
        "a_bor": "|",
        "a_xor": "^",
        "a_bnot": "~",
        "a_shl": "<<",
        "a_shr": ">>",
        "a_sizeof_fmt": "size %s",
    }

    # Register names, indexed by the register number produced by
    # Operand.parse(). The last two entries are the fake segment registers.
    reg_names = regNames = ["$%s" % n for n in [
        "AR0", "AR1", "AR2", "AR3",
        "IX0", "IX1", "IX2", "IX3",
        "WR0", "WR1", "WR2", "WR3",
        "ST0", "ST1", "ST2", "ST3",
        "AC0.H", "AC1.H",
        "CR", "SR",
        "PROD.L", "PROD.M1", "PROD.H", "PROD.M2",
        "AX0.L", "AX1.L", "AX0.H", "AX1.H",
        "AC0.L", "AC1.L", "AC0.M", "AC1.M",
        "AC0", "AC1",
        "AX0", "AX1",
        "CS", "DS"
    ]]

    def __init__(self):
        processor_t.__init__(self)
        self._init_instructions()
        self._init_registers()

    def _add_instruction(self, instr):
        """Register `instr` for every 16-bit opcode value it matches.

        Fills `instrs_opcode` for each value `v` with
        `v & instr.mask == instr.opcode`, then appends `instr` to
        `instrs_list`.
        """
        base = instr.opcode & instr.mask
        # Bits outside the mask are "don't care": the largest such value
        # bounds the range of candidate opcodes to scan.
        limit = instr.mask ^ 0xFFFF
        for opcode in range(base, base + limit + 1):
            if (opcode & instr.mask) == instr.opcode:
                self.instrs_opcode[opcode] = instr
        self.instrs_list.append(instr)

    def _init_instructions(self):
        """Setup instructions parameters for IDA.

        Creates `instrs_opcode` (opcode value -> Instr), `instrs_list`,
        `instruc`/`instruc_end`, the name lookups `instrs` and `instrs_ids`,
        and assigns each Instr its index in `instrs_list` as `id`.
        """
        self.instrs_opcode = [None] * 0x10000
        self.instrs_list = []

        for op in opcodes:
            name = op[0]
            stops = name in ("RET", "RTI", "HALT", "JMP", "JMPR")
            jumps = name.startswith("J")
            calls = name.startswith("CALL")
            instr = Instr(name, op[1], op[2], op[3], op[5],
                          stops=stops, jumps=jumps, calls=calls)

            if op[6]:  # extended
                # Opcodes 0x3xxx only have 7 bits available for the extension.
                ext_7bit = (instr.opcode & 0xF000) == 0x3000
                for ext in opcodes_ext[1:]:  # skip not extended
                    if ext_7bit and ext[1] >= 0x80:
                        continue
                    xinstr = Instr(instr.name + "'" + ext[0],
                                   instr.opcode | ext[1],
                                   instr.mask | ext[2],
                                   instr.size,
                                   instr.operands, ext_operands=ext[5],
                                   stops=stops, jumps=jumps, calls=calls)
                    self._add_instruction(xinstr)

                # Only now widen the base mask, so the plain instruction
                # matches just the encoding whose extension bits are zero.
                if ext_7bit:
                    instr.mask |= 0x7F
                else:
                    instr.mask |= 0xFF

            # _add_instruction() already appends to instrs_list; appending
            # here as well would list every base instruction twice.
            self._add_instruction(instr)

        self.instruc = [{"name": i.name, "feature": i.flags}
                        for i in self.instrs_list]
        self.instruc_end = len(self.instruc)

        self.instrs = {}
        self.instrs_ids = {}
        for i, instr in enumerate(self.instrs_list):
            self.instrs[instr.name] = instr
            self.instrs_ids[instr.name] = i
            instr.id = i

    def _init_registers(self):
        """Setup registers index and special register values."""
        self.reg_ids = {}
        for i, reg in enumerate(self.reg_names):
            self.reg_ids[reg] = i

        # Simulate fake segment registers
        self.regFirstSreg = self.regCodeSreg = self.reg_ids["$CS"]
        self.regLastSreg = self.regDataSreg = self.reg_ids["$DS"]

    def notify_init(self, idp_file):
        """Called at module initialization."""
        cvar.inf.mf = True  # set to big endian... wtf
        cvar.inf.wide_high_byte_first = True  # big endian for 16b bytes too
        return True

    def notify_endbinary(self, ok):
        """Called when the binary finished loading; prints the banner."""
        if ok:
            # Call form works as a statement on Python 2 and a function on 3.
            print(GREETINGS_STRING)

    def _read_cmd_byte(self):
        """Read the next unit of the current instruction and advance.

        Returns `get_full_byte()` at `cmd.ea + cmd.size` and increments
        `cmd.size` by one.
        """
        ea = self.cmd.ea + self.cmd.size
        byte = get_full_byte(ea)
        self.cmd.size += 1
        return byte

    def ana(self):
        """Analyze one instruction and fill the "cmd" instance member.

        Returns the instruction size (`cmd.size`), or 0 when the first word
        does not match any known instruction.
        """
        cmd = self.cmd

        word1 = self._read_cmd_byte()
        instr = self.instrs_opcode[word1]
        if instr is None:
            return 0

        # Two-unit instructions carry their second operand word right after.
        word2 = self._read_cmd_byte() if instr.size == 2 else 0

        # Reset all six operand slots, then decode the ones actually present.
        slots = [cmd[i] for i in range(6)]
        for slot in slots:
            slot.type = o_void
        for slot, op in zip(slots, instr.all_ops_parsed):
            op.parse(slot, word1, word2)

        cmd.itype = instr.id
        return cmd.size

    def _emu_operand(self, op):
        """Create the data or code cross-reference for one operand.

        Memory operands get a data item and a read data reference; near
        operands get a call or jump code reference depending on whether the
        instruction has the CF_CALL feature. Other operand types are ignored.
        """
        if op.type == o_mem:
            ua_dodata2(0, op.addr, op.dtyp)
            ua_add_dref(0, op.addr, dr_R)  # TODO: dr_W ?
        elif op.type == o_near:
            if self.cmd.get_canon_feature() & CF_CALL:
                fl = fl_CN
            else:
                fl = fl_JN
            ua_add_cref(0, op.addr, fl)

    def emu(self):
        """Emulate instruction behavior and create x-refs, interpret operand
        values, etc. Always returns True."""
        instr = self.instrs_list[self.cmd.itype]
        for i in range(len(instr.all_operands)):
            self._emu_operand(self.cmd[i])

        if not instr.stops:  # add a link to next instr if code continues
            ua_add_cref(0, self.cmd.ea + self.cmd.size, fl_F)
        return True

    def outop(self, op):
        """Generates text representation of an instruction operand.

        Returns False for operand types this module does not print, True
        otherwise.
        """
        if op.type == o_reg:
            out_register(self.reg_names[op.reg])
        elif op.type == o_phrase:
            out_symbol('@')
            out_register(self.reg_names[op.reg])
        elif op.type == o_imm:
            OutValue(op, OOFW_IMM)
        elif op.type in [o_near, o_mem]:
            ok = out_name_expr(op, op.addr, BADADDR)
            if not ok:
                # No name for the address: print it raw, flagged as an error.
                out_tagon(COLOR_ERROR)
                OutLong(op.addr, 16)
                out_tagoff(COLOR_ERROR)
                QueueMark(Q_noName, self.cmd.ea)
        else:
            return False
        return True

    def out(self):
        """Generates text representation of an instruction in the "cmd" inst
        member.

        Operands are separated by ", "; the first operand belonging to the
        extension part is introduced by " : " instead.
        """
        cmd = self.cmd

        buf = init_output_buffer(1024)
        OutMnem(15)  # max width = 15

        instr = self.instrs_list[cmd.itype]

        in_extended = False
        for i in range(0, 6):
            if cmd[i].type == o_void:
                break

            if i != 0:
                if not in_extended and i >= len(instr.operands):
                    in_extended = True
                    OutChar(' ')
                    out_symbol(':')
                else:
                    out_symbol(',')
                OutChar(' ')

            out_one_operand(i)

        term_output_buffer()
        cvar.gl_comm = 1  # allow comments at end of line
        MakeLine(buf)
def PROCESSOR_ENTRY():
    """Module entry point: build and return a new GCDSPProcessor."""
    processor = GCDSPProcessor()
    return processor