Implement basic assembler
This commit is contained in:
parent
ffd1bda725
commit
81039ce304
151
asm.py
Executable file
151
asm.py
Executable file
@ -0,0 +1,151 @@
|
|||||||
|
#!/usr/bin/env python3
|
||||||
|
# synacor.py - An implementation of the Synacor Challenge
|
||||||
|
# Copyright © 2017 RunasSudo
|
||||||
|
#
|
||||||
|
# This program is free software: you can redistribute it and/or modify
|
||||||
|
# it under the terms of the GNU Affero General Public License as published by
|
||||||
|
# the Free Software Foundation, either version 3 of the License, or
|
||||||
|
# (at your option) any later version.
|
||||||
|
#
|
||||||
|
# This program is distributed in the hope that it will be useful,
|
||||||
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
# GNU Affero General Public License for more details.
|
||||||
|
#
|
||||||
|
# You should have received a copy of the GNU Affero General Public License
|
||||||
|
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
|
||||||
|
from libsynacor import *
|
||||||
|
|
||||||
|
import argparse
|
||||||
|
import struct
|
||||||
|
|
||||||
|
# Command-line interface: the assembly listing to read and the memory image
# to write, both given as positional arguments.
parser = argparse.ArgumentParser()
for _arg_name, _arg_help in (
    ('file', '.asm file to read'),
    ('output', '.bin file to write'),
):
    parser.add_argument(_arg_name, help=_arg_help)
args = parser.parse_args()

# Number of source lines read so far; bumped by assemble_next_instruction on
# every readline() and quoted in the error raised when assembly fails.
line_no = 0
|
||||||
|
|
||||||
|
def split_line(line):
    """Split one line of assembly source into tokens.

    Tokens are separated by whitespace. A double-quoted string is kept as
    part of a single token, with its quotes and backslash escapes left
    exactly as written (decoding them is the caller's job), so it may contain
    spaces and semicolons. Outside a string, ``;`` starts a comment that runs
    to the end of the line.

    Returns the tokens in order of appearance; the list is empty for a blank
    or comment-only line.
    """
    tokens = []
    token = ''

    in_string = False
    in_escape = False

    for char in line:
        if in_string:
            # Everything inside a string belongs to the current token
            token += char
            if in_escape:
                # An escape covers exactly one character; without this reset
                # the closing quote would never be recognised again.
                in_escape = False
            elif char == '\\':
                in_escape = True
            elif char == '"':
                in_string = False
        elif char == ';':
            # Comment: nothing after this point can contribute a token
            break
        elif char.isspace():
            if token != '':
                tokens.append(token)
                token = ''
        elif char == '"':
            in_string = True
            token += char
        else:
            token += char

    # Final token
    if token != '':
        tokens.append(token)

    return tokens
|
||||||
|
|
||||||
|
def unescape_char(char):
    r"""Decode backslash escape sequences in *char* and return the result.

    Escapes are interpreted by Python's ``unicode_escape`` codec, so ``\n``,
    ``\x41`` and ``\"`` become a newline, ``A`` and ``"``. Despite the name,
    *char* may be a string of any length, including the empty string.
    """
    # unicode_escape decodes raw bytes as Latin-1, so a round trip through
    # UTF-8 turns every non-ASCII character into mojibake. Encode as Latin-1
    # instead and let backslashreplace spell anything outside Latin-1 as a
    # \uXXXX escape, which the decoder then restores.
    # NOTE(review): a literal backslash written directly before a character
    # outside Latin-1 pairs up with the generated escape and leaves the
    # \uXXXX text undecoded; that input was already garbled before this fix.
    return char.encode('latin-1', 'backslashreplace').decode('unicode_escape')
|
||||||
|
|
||||||
|
def assemble_next_instruction(source):
    """Assemble the next line of *source* that contains any tokens.

    *source* is an open text file positioned at the next unread line. Every
    line read increments the module-level ``line_no`` counter.

    Returns whatever assemble_instruction returns for the first line that
    tokenises to something, or ``(None, [])`` once the end of the file is
    reached.
    """
    global line_no

    # Blank and comment-only lines are skipped in a loop rather than through
    # the assemble_instruction -> assemble_next_instruction recursion, so a
    # long run of them cannot exhaust the interpreter's recursion limit.
    while True:
        line = source.readline()
        line_no += 1
        if line == '':
            # readline() yields '' only at end of file (a blank line is '\n')
            return None, []

        tokens = split_line(line.strip())
        if tokens:
            return assemble_instruction(source, tokens)
|
||||||
|
|
||||||
|
def assemble_instruction(source, tokens):
    """Turn the tokens of one source line into instruction objects.

    source -- open source file; read further only when *tokens* is empty
              (for example after a label that stands alone on its line)
    tokens -- tokens of the current line as produced by split_line

    Returns ``(instructions, labels)``. ``instructions`` is a list of
    instruction objects, or None when the end of the file was reached before
    any instruction was found. ``labels`` lists the names of the labels
    (trailing ``:`` removed) that preceded the instruction, innermost first.

    Operands starting with ``R`` are registers with a decimal index; all
    other operands are hexadecimal literals. ``out`` with a string operand
    expands to one ``out`` per character, and ``data`` takes either a string
    or any number of hexadecimal words.

    Raises Exception for an unknown mnemonic or a wrong operand count;
    ValueError from int() propagates for malformed numbers.
    """
    if len(tokens) == 0:
        return assemble_next_instruction(source)

    if tokens[0].endswith(':'):
        # Label
        label = tokens[0][:-1]
        instructions, inst_labels = assemble_instruction(source, tokens[1:])
        return instructions, inst_labels + [label]

    # Instruction
    name = tokens[0]
    if name not in instructions_by_name:
        raise Exception('Unknown instruction {}'.format(name))
    instruction = instructions_by_name[name]()

    # Checked once with a length guard so that a bare mnemonic reaches the
    # operand-count error (or yields empty data) instead of an IndexError.
    has_string_arg = len(tokens) > 1 and tokens[1].startswith('"')

    # Special cases
    if isinstance(instruction, InstructionOut) and has_string_arg:
        # Strip the surrounding quotes, then emit one `out` per character
        chars = unescape_char(tokens[1][1:-1])
        instructions = []
        for char in chars:
            out_instruction = InstructionOut()
            out_instruction.args.append(OpLiteral(ord(char)))
            instructions.append(out_instruction)
        return instructions, []

    if isinstance(instruction, InstructionData):
        # For data, args holds raw word values rather than operand objects
        if has_string_arg:
            chars = unescape_char(tokens[1][1:-1])
            instruction.args = [ord(char) for char in chars]
        else:
            instruction.args = [int(x, 16) for x in tokens[1:]]
        return [instruction], []

    if len(tokens) != instruction.nargs + 1:
        raise Exception('Invalid number of arguments: Expected {}, got {}'.format(instruction.nargs, len(tokens) - 1))

    # The count check above guarantees tokens[1:] holds exactly nargs operands
    for argstr in tokens[1:]:
        if argstr.startswith('R'):
            # Register
            arg = OpRegister(int(argstr[1:]))
        else:
            # Hex literal
            arg = OpLiteral(int(argstr, 16))
        instruction.args.append(arg)
    return [instruction], []
|
||||||
|
|
||||||
|
# TODO: First pass
|
||||||
|
|
||||||
|
# Second pass
|
||||||
|
# Memory image being built: 32768 words, zero-filled, written front to back
SYN_MEM = [0] * 32768
# Index of the next free word in SYN_MEM
SYN_PTR = 0

with open(args.file, 'r') as source:
    try:
        while True:
            # labels are collected but not used yet; resolving them is left
            # to the first pass, which is still a TODO
            instructions, labels = assemble_next_instruction(source)
            if instructions is None:
                # End of the source file
                break
            for instruction in instructions:
                code = instruction.assemble()
                # A slice assignment past the end would silently grow the
                # list and only fail later in struct.pack, without a line
                # number; reject the overflow here instead.
                if SYN_PTR + len(code) > len(SYN_MEM):
                    raise Exception('Program does not fit in {} words of memory'.format(len(SYN_MEM)))
                SYN_MEM[SYN_PTR:SYN_PTR+len(code)] = code
                SYN_PTR += len(code)
    except Exception as ex:
        # Attach the current source line number while keeping the cause
        raise Exception('Error at line {}'.format(line_no)) from ex

with open(args.output, 'wb') as f:
    # The whole image is written as 32768 little-endian unsigned 16-bit words
    f.write(struct.pack('<32768H', *SYN_MEM))
|
10
disasm.py
10
disasm.py
@ -17,13 +17,17 @@
|
|||||||
|
|
||||||
from libsynacor import *
|
from libsynacor import *
|
||||||
|
|
||||||
import sys
|
import argparse
|
||||||
|
|
||||||
with open(sys.argv[1], 'rb') as data:
|
parser = argparse.ArgumentParser()
|
||||||
|
parser.add_argument('file', help='.bin file containing the initial memory dump')
|
||||||
|
args = parser.parse_args()
|
||||||
|
|
||||||
|
with open(args.file, 'rb') as data:
|
||||||
SYN_MEM = memory_from_file(data)
|
SYN_MEM = memory_from_file(data)
|
||||||
|
|
||||||
def escape_char(char):
|
def escape_char(char):
|
||||||
return char.replace('\\', '\\\\').replace('\n', '\\n').replace('"', '\\"')
|
return char.encode('unicode_escape').decode('utf-8').replace('"', '\\"')
|
||||||
|
|
||||||
MODE_OUT = False
|
MODE_OUT = False
|
||||||
MODE_DAT = False #False, 1 (data), 2 (text)
|
MODE_DAT = False #False, 1 (data), 2 (text)
|
||||||
|
@ -33,6 +33,8 @@ class OpLiteral(Operand):
|
|||||||
|
|
||||||
def describe(self):
|
def describe(self):
|
||||||
return '{:04x}'.format(self.value)
|
return '{:04x}'.format(self.value)
|
||||||
|
def assemble(self):
|
||||||
|
return self.value
|
||||||
|
|
||||||
class OpRegister(Operand):
|
class OpRegister(Operand):
|
||||||
def __init__(self, register):
|
def __init__(self, register):
|
||||||
@ -44,6 +46,8 @@ class OpRegister(Operand):
|
|||||||
|
|
||||||
def describe(self):
|
def describe(self):
|
||||||
return 'R{}'.format(self.register)
|
return 'R{}'.format(self.register)
|
||||||
|
def assemble(self):
|
||||||
|
return self.register + 32768
|
||||||
|
|
||||||
instructions_by_opcode = {}
|
instructions_by_opcode = {}
|
||||||
instructions_by_name = {}
|
instructions_by_name = {}
|
||||||
@ -70,6 +74,9 @@ class Instruction:
|
|||||||
description += ' {}'.format(self.args[i].describe())
|
description += ' {}'.format(self.args[i].describe())
|
||||||
return description
|
return description
|
||||||
|
|
||||||
|
def assemble(self):
|
||||||
|
return [self.opcode] + [self.args[i].assemble() for i in range(self.nargs)]
|
||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
def next_instruction(data, idx):
|
def next_instruction(data, idx):
|
||||||
opcode = Operand.read_op(data[idx])
|
opcode = Operand.read_op(data[idx])
|
||||||
@ -217,3 +224,10 @@ class InstructionIn(Instruction):
|
|||||||
cpu.SYN_STDIN_BUF = list(line)
|
cpu.SYN_STDIN_BUF = list(line)
|
||||||
|
|
||||||
self.args[0].set(cpu, ord(cpu.SYN_STDIN_BUF.pop(0)))
|
self.args[0].set(cpu, ord(cpu.SYN_STDIN_BUF.pop(0)))
|
||||||
|
|
||||||
|
# Not actually an instruction, but convenient to think of it as one for the purposes of assembling
|
||||||
|
# self.args is an array of literal values, rather than Operands
|
||||||
|
class InstructionData(Instruction):
|
||||||
|
def assemble(self):
|
||||||
|
return self.args
|
||||||
|
instructions_by_name['data'] = InstructionData
|
||||||
|
Reference in New Issue
Block a user