import os, re from proc import proc import lex import op class parser: def __init__(self): self.strip_path = 0 self.__globals = {} self.__offsets = {} self.__stack = [] self.proc = None self.proc_list = [] self.binary_data = [] self.symbols = [] self.link_later = [] def visible(self): for i in self.__stack: if not i or i == 0: return False return True def push_if(self, text): value = self.eval(text) #print "if %s -> %s" %(text, value) self.__stack.append(value) def push_else(self): #print "else" self.__stack[-1] = not self.__stack[-1] def pop_if(self): #print "endif" return self.__stack.pop() def set_global(self, name, value): if len(name) == 0: raise Exception("empty name is not allowed") name = name.lower() #print "adding global %s -> %s" %(name, value) if self.__globals.has_key(name): raise Exception("global %s was already defined", name) self.__globals[name] = value def get_global(self, name): name = name.lower() return self.__globals[name] def has_global(self, name): name = name.lower() return self.__globals.has_key(name) def set_offset(self, name, value): if len(name) == 0: raise Exception("empty name is not allowed") name = name.lower() #print "adding global %s -> %s" %(name, value) if self.__offsets.has_key(name): raise Exception("global %s was already defined", name) self.__offsets[name] = value def get_offset(self, name): name = name.lower() return self.__offsets[name] def get_offsets(self): return self.__offsets def include(self, basedir, fname): path = fname.split('\\')[self.strip_path:] path = os.path.join(basedir, os.path.pathsep.join(path)) #print "including %s" %(path) self.parse(path) def eval(self, stmt): try: return self.parse_int(stmt) except: pass value = self.__globals[stmt.lower()].value return int(value) def expr_callback(self, match): name = match.group(1).lower() g = self.get_global(name) if isinstance(g, op.const): return g.value else: return "0x%04x" %g.offset def eval_expr(self, expr): n = 1 while n > 0: expr, n = re.subn(r'\b([a-zA-Z_]+[a-zA-Z0-9_]*)', self.expr_callback, expr) return eval(expr) def expand_globals(self, text): return text def fix_dollar(self, v): return re.sub(r'\$', "%d" %len(self.binary_data), v) def parse_int(self, v): if re.match(r'[01]+b$', v): v = int(v[:-1], 2) if re.match(r'[\+-]?[0-9a-f]+h$', v): v = int(v[:-1], 16) return int(v) def compact_data(self, width, data): #print "COMPACTING %d %s" %(width, data) r = [] base = 0x100 if width == 1 else 0x10000 for v in data: if v[0] == '"': if v[-1] != '"': raise Exception("invalid string %s" %v) if width == 2: raise Exception("string with data width more than 1") #we could allow it :) for i in xrange(1, len(v) - 1): r.append(ord(v[i])) continue m = re.match(r'(\w+)\s+dup\s+\((\s*\S+\s*)\)', v) if m is not None: #we should parse that n = self.parse_int(m.group(1)) if m.group(2) != '?': value = self.parse_int(m.group(2)) else: value = 0 for i in xrange(0, n): v = value for b in xrange(0, width): r.append(v & 0xff); v >>= 8 continue try: v = self.parse_int(v) if v < 0: v += base except: #global name print "global/expr: %s" %v try: g = self.get_global(v) v = g.offset except: print "unknown address %s" %(v) self.link_later.append((len(self.binary_data) + len(r), v)) v = 0 for b in xrange(0, width): r.append(v & 0xff); v >>= 8 #print r return r def parse(self, fname): # print "opening file %s..." %(fname, basedir) fd = open(fname, 'rb') for line in fd: line = line.strip() if len(line) == 0 or line[0] == ';' or line[0] == chr(0x1a): continue #print cmd m = re.match('(\w+)\s*?:', line) if m is not None: line = line[len(m.group(0)):] if self.visible(): name = m.group(1) if self.proc is not None: self.proc.add_label(name) self.set_offset(name, (len(self.binary_data), self.proc, len(self.proc.stmts) if self.proc is not None else 0)) cmd = line.split() if len(cmd) == 0: continue cmd0 = str(cmd[0]) if cmd0 == 'if': self.push_if(cmd[1]) continue elif cmd0 == 'else': self.push_else() continue elif cmd0 == 'endif': self.pop_if() continue if not self.visible(): continue if cmd0 == 'db' or cmd0 == 'dw' or cmd0 == 'dd': arg = " ".join(cmd[1:]) binary_width = {'b': 1, 'w': 2, 'd': 4}[cmd0[1]] self.binary_data += self.compact_data(binary_width, lex.parse_args(arg)) continue elif cmd0 == 'include': self.include(os.path.dirname(fname), cmd[1]) continue elif cmd0 == 'endp': self.proc = None continue elif cmd0 == 'assume': print "skipping: %s" %line continue elif cmd0 == 'rep': self.proc.add(cmd0) self.proc.add(" ".join(cmd[1:])) continue if len(cmd) >= 3: cmd1 = cmd[1] if cmd1 == 'equ': v = cmd[2] self.set_global(cmd0, op.const(self.fix_dollar(v))) elif cmd1 == 'db' or cmd1 == 'dw' or cmd1 == 'dd': binary_width = {'b': 1, 'w': 2, 'd': 4}[cmd1[1]] self.binary_data += self.compact_data(binary_width, lex.parse_args(" ".join(cmd[2:]))) self.set_global(cmd0.lower(), op.var(binary_width, len(self.binary_data))) continue elif cmd1 == 'proc': name = cmd0.lower() self.proc = proc(name) print "procedure %s, #%d" %(name, len(self.proc_list)) self.proc_list.append(name) self.set_global(name, self.proc) continue if (self.proc): self.proc.add(line) else: #print line pass fd.close() return self def link(self): for addr, expr in self.link_later: v = self.eval_expr(expr) print "link: patching %04x -> %04x" %(addr, v) while v != 0: self.binary_data[addr] = v & 0xff addr += 1 v >>= 8