# scan_nextid_osx.rb (forked from DFHack/df_misc)
require 'metasm'
# metasm script to find all 'job_next_id' 'building_next_id' etc globals in dwarf fortress
# tested in 34.10, osx
# run with ruby -v for debug msgs
$: << File.dirname(__FILE__)
require 'osx_scanxrefs'
# code has pattern:
# push ebp
# push edi
# call get_pc_thunk_ebx
# lea ebp, [ebx+ptr_job_next_id-gotip]
# lea eax, [ebx+a_load_game-gotip]
# mov ecx, [ebp]
# cmp eax, [ecx]
# jl foobar
#
#ptr_job_next_id dd job_next_id
#job_next_id dd 0
#a_load_game_invalid_job_id_number db "Load Game: Invalid Job ID Number, ", 0
# Step 1: load the binary, collect every "Load Game: Invalid ... ID Number"
# string, and find a code location that references the Job ID one.
puts 'read file' if $VERBOSE
# Binary to analyse: first command-line argument, falling back to a default name.
binpath = ARGV.shift || 'dwarfort.exe'
dasm = Metasm::AutoExe.decode_file(binpath).disassembler

puts 'scan "invalid id" strings' if $VERBOSE
# strings maps the address of each pattern match to the string decoded there.
strings = {}
dasm.pattern_scan(/Load Game: Invalid (\w|\s)* ID Number/) { |str_addr|
  strings[str_addr] = dasm.decode_strz(str_addr)
}

# Reverse lookup (value -> address). Hash#index was removed in Ruby 3.0;
# Hash#key is its replacement and behaves the same.
a_jobid = strings.key('Load Game: Invalid Job ID Number, ')
raise 'no Invalid Job ID string' if not a_jobid

# scan_code_xrefs is not defined in this file (presumably it comes from
# osx_scanxrefs); only its first result is used.
addr = scan_code_xrefs(dasm, a_jobid)[0]
raise 'no Invalid Job ID xref' if not addr
# Step 2: locate the start of the function that contains the xref.
#
# On linux/windows, the code loops around the xref, so we can simply
# disassemble from the xref. Here on osx, this is not the case, so scan
# backwards (at most 0x100 bytes) for a function prologue: 4 push reg or more.
# The byte test below accepts any opcode byte in 0x50..0x5f.
is_push = lambda { |a| dasm.decode_byte(a) & 0xf0 == 0x50 }

funcstart = nil
0x100.times { |i|
  cand = addr - i
  # need 4 consecutive matching bytes, and the byte before must not match
  # (ensures this is the 1st push)
  next unless (0..3).all? { |k| is_push.call(cand + k) } && !is_push.call(cand - 1)

  puts 'funcstart %x' % cand if $VERBOSE
  dasm.disassemble_fast(cand)

  # check we actually get an xref to 'Invalid Job ID'
  getstr = dasm.di_including(addr)
  next unless getstr && getstr.opcode.name == 'lea'

  # find the value of lea's reg arg
  a0 = getstr.instruction.args[0].symbolic
  bt = dasm.backtrace(a0, getstr.address, :include_start => true)
  if bt.length == 1 && bt[0].reduce == a_jobid
    # lea loads the address of the Job ID string !
    funcstart = cand
    break
  end
}

# Fail with a clear message instead of a TypeError from '%x' % nil (verbose
# mode) or passing nil on to the function walk below.
raise 'initIDs function start not found' if not funcstart
puts 'found initIDs function: %x' % funcstart if $VERBOSE
# Step 3: now we can parse the function, and check for the code pattern.
# Each match produces one <global-address .../> line; the sorted lines are
# printed at the end.
xml = []
dasm.each_function_block(funcstart) { |baddr|
  # for every basic block ending in a 'jl'
  blk = dasm.block_at(baddr)
  next if blk.list.last.opcode.name != 'jl'

  # the instruction right before the jl must be the cmp; a block holding only
  # the jl has no such instruction and is reported the same way
  cmp = blk.list[-2]
  raise 'no cmp/jl?' unless cmp && cmp.opcode.name == 'cmp'

  # find the memory pointer used for comparison, this is the nextid value
  ptr = cmp.instruction.args[1].symbolic.target
  id_addr = dasm.normalize(dasm.backtrace(ptr, cmp.address).first)

  # now we assume we have only 2 blocks:
  #  one with the 2 lea, and it jumps to the block with the jl
  #   lea nextid_ptr ; lea str ; jmp foo
  #   foo: cmp reg, [nextid]; jl xx
  # now, find the predecessor of the 'jl' block having only 1 successor
  strblk = (blk.from_normal || []).find { |fb| dasm.block_at(fb).to_normal.length == 1 }
  raise "no single-successor predecessor for jl block #{baddr.inspect}" if not strblk

  dasm.block_at(strblk).list.each { |di|
    # find all lea reg, [ebx+XX]
    next unless di.opcode.name == 'lea' && di.instruction.args[1].b.symbolic == :ebx

    # compute the loaded register value
    bt = dasm.backtrace(di.instruction.args[0].symbolic, di.address, :include_start => true)
    next unless bt.length == 1

    # if it maps to one of the scanned nextID strings, we won
    str = strings[bt[0].reduce]
    next unless str

    # e.g. "Invalid Job ID Number" gives "job_next_id"
    name = str[/Invalid (.*) ID Number/, 1].downcase.gsub(' ', '_') + '_next_id'
    xml << "<global-address name='#{name}' value='0x#{'%08x' % id_addr}'/>"
    puts xml.last if $VERBOSE
  }
}

puts if $VERBOSE
puts xml.sort