rubyx/lib/register/assembler.rb

228 lines
7.5 KiB
Ruby
Raw Normal View History

module Register
2014-08-29 20:00:25 +02:00
# Assemble the object space into a binary.
# Link first to get positions, then assemble.
# The link and assemble functions for each class are kept close to each other, so that they stay in sync:
# the link function determines the length of an object and the assemble function actually writes the bytes,
# so they are pretty much dependent on each other. In an earlier version they were functions on the objects,
# but now this has moved to a visitor pattern.
class Assembler
2014-09-09 12:28:07 +02:00
# Type tag that type_word writes for a slot holding a reference.
TYPE_REF = 0
# Type tag that type_word writes for a slot holding an integer.
TYPE_INT = 1
# Number of bits each slot's type tag occupies inside a type word.
TYPE_BITS = 4
# Tag position (in units of TYPE_BITS) at which type_word adds its length field;
# also the number of TYPE_INT tags written for methods and strings.
TYPE_LENGTH = 6
# Create an assembler for the given object space.
# space:: the root object that link hands to add_object
def initialize(space)
  @space = space
  # object_id => object, filled by add_object
  @objects = Hash.new
end
# Read access to the collected objects (object_id => object), as filled in by add_object.
attr_reader :objects
# Collect every object reachable from the space and give each one a position.
# Positions start at 4 (room for the initial jump); all compiled methods are
# placed first, followed by every other (data) object.
def link
  add_object(@space)
  offset = 4 # first jump instruction
  place = lambda do |entry|
    entry.set_position(offset)
    offset += entry.mem_length
  end
  # first all functions
  @objects.each_value { |entry| place.call(entry) if entry.is_a?(Virtual::CompiledMethod) }
  # and then all data objects
  @objects.each_value { |entry| place.call(entry) unless entry.is_a?(Virtual::CompiledMethod) }
end
2014-08-26 21:35:56 +02:00
# Link the object space and write the complete binary.
# The output starts with a jump to the compiled method named :__init__,
# followed by all compiled methods and then all remaining (data) objects.
# Returns the assembled bytes as a String.
# Raises RuntimeError when no :__init__ method was linked.
def assemble
  link
  @stream = StringIO.new
  main = @objects.each_value.find do |objekt|
    objekt.is_a?(Virtual::CompiledMethod) && objekt.name == :__init__
  end
  # without an entry point there is nothing the initial jump could target
  raise "No __init__ method found among the linked objects" unless main
  puts "function found #{main.name}"
  initial_jump = RegisterMachine.instance.b( main )
  initial_jump.set_position( 0)
  initial_jump.assemble( @stream )
  # same order as in link: functions first, then data
  @objects.each_value do |objekt|
    next unless objekt.is_a? Virtual::CompiledMethod
    assemble_object( objekt )
  end
  @objects.each_value do |objekt|
    next if objekt.is_a? Virtual::CompiledMethod
    assemble_object( objekt )
  end
  puts "Assembled #{@stream.length.to_s(16)}"
  @stream.string
end
# Assemble a single object by dispatching on its class name:
# an instance of Some::Module::Foo is handed to assemble_Foo.
# Raises RuntimeError when the stream is not at the position that was assigned to the object.
# Returns the position of the object.
def assemble_object(obj)
  puts "Assemble #{obj.class}(#{obj.object_id}) at stream #{(@stream.length).to_s(16)} pos:#{obj.position.to_s(16)} , len:#{obj.mem_length}"
  raise "Assemble #{obj.class} at #{@stream.length.to_s(16)} not #{obj.position.to_s(16)}" if @stream.length != obj.position
  # only the last part of the (possibly namespaced) class name selects the method
  clazz = obj.class.name.split("::").last
  send("assemble_#{clazz}".to_sym , obj)
  obj.position
end
2014-09-09 12:28:07 +02:00
# Compute the type word for the given slots.
# Each element contributes one tag of TYPE_BITS bits at its index: TYPE_INT for integers,
# TYPE_REF for everything else. On top of that, (array.length + 1) / 8 is added
# at tag position TYPE_LENGTH.
# Returns the word as an Integer.
def type_word(array)
  word = 0
  array.each_with_index do |var, index|
    # is_a? also matches Fixnum/Bignum on rubies where Integer is only their superclass
    type = var.is_a?(Integer) ? TYPE_INT : TYPE_REF
    word += type << (index * TYPE_BITS)
  end
  word += ((array.length + 1) / 8) << (TYPE_LENGTH * TYPE_BITS)
  word
end
2014-08-29 20:00:25 +02:00
# Write the type word and the layout reference of the instance, followed by the variables that are passed.
# Variables are values, i.e. ints or refs; each of them is written with write_ref_for.
# Raises RuntimeError when the object was never linked (not registered in @objects).
# Returns the position of the object.
def assemble_self( object , variables )
  raise "Object(#{object.object_id}) not linked #{object.inspect}" unless @objects[object.object_id]
  type = type_word(variables)
  @stream.write_uint32( type )
  write_ref_for(object.layout[:names] , object )
  variables.each do |var|
    write_ref_for(var , object)
  end
  # one word (4 bytes) was written per variable
  pad_after( variables.length * 4 )
  object.position
end
# Write an array: type word, reference to the array's layout names, then one reference per element.
# Returns the position of the array.
def assemble_Array(array)
  type = type_word(array)
  @stream.write_uint32( type )
  # the layout belongs to the array (a bare `layout` is not defined in the assembler)
  write_ref_for(array.layout[:names] , array) #ref
  array.each do |var|
    write_ref_for(var , array)
  end
  # one word (4 bytes) was written per element
  pad_after( array.length * 4 )
  array.position
end
# Write a hash as an instance with two variables: the keys and values stored in its layout.
# Returns whatever assemble_self returns.
def assemble_Hash(hash)
  # so here we can be sure to have _identical_ keys/values arrays
  assemble_self( hash , [ hash.layout[:keys] , hash.layout[:values] ] )
end
# Write the space as an instance with two variables: its classes and its objects.
# Returns whatever assemble_self returns.
def assemble_BootSpace(space)
  assemble_self(space , [space.classes , space.objects] )
end
# Write a class as an instance with three variables: name, super class name and instance methods.
# Returns whatever assemble_self returns.
def assemble_BootClass(clazz)
  assemble_self( clazz , [clazz.name , clazz.super_class_name , clazz.instance_methods] )
end
# Write a compiled method: a type word, the reference to its layout names and then
# the assembled codes of all its blocks, padded at the end.
# Raises RuntimeError when the length word would exceed 15 (splitting is not implemented).
def assemble_CompiledMethod(method)
  # summed length of all blocks; pad_after below receives the same number
  count = method.blocks.inject(0) { |sum , block| sum + block.length }
  word = (count + 7) / 32 # all object are multiple of 8 words (7 for header)
  raise "Method too long, splitting not implemented #{method.name}/#{count}" if word > 15
  # first line is integers, convention is that following lines are the same
  TYPE_LENGTH.times { word = ((word << TYPE_BITS) + TYPE_INT) }
  @stream.write_uint32( word )
  write_ref_for(method.layout[:names] , method) #ref of layout
  # TODO the assembly may have to move to the object to be more extensible
  method.blocks.each do |block|
    block.codes.each do |code|
      code.assemble( @stream )
    end
  end
  pad_after( count )
end
# Write a string: a type word, the reference to the string's layout names and then the
# characters, padded at the end. Accepts a String, a Symbol or a Virtual::StringConstant;
# the latter two are converted to their String first.
# Raises RuntimeError when the length word would exceed 15 (splitting is not implemented).
def assemble_String( str )
  object = str # the object as it was passed in; str becomes the plain String below
  str = str.string if str.is_a? Virtual::StringConstant
  str = str.to_s if str.is_a? Symbol
  word = (str.mem_length + 7) / 32 # all object are multiple of 8 words (7 for header)
  raise "String too long (implement split string!) #{word}" if word > 15
  # first line is integers, convention is that following lines are the same
  TYPE_LENGTH.times { word = ((word << TYPE_BITS) + TYPE_INT) }
  @stream.write_uint32( word )
  # the original passed an undefined local here, which raised NameError
  write_ref_for( str.layout[:names] , object ) #ref
  @stream.write str
  pad_after(str.mem_length)
end
# Symbols are written exactly like strings; assemble_String does the conversion.
def assemble_Symbol(sym)
  assemble_String(sym)
end
# String constants are written exactly like strings; assemble_String unwraps the constant.
def assemble_StringConstant( sc )
  assemble_String(sc)
end
2014-08-29 20:00:25 +02:00
# Register an object (keyed by its object_id) together with its layout names, then let the
# class specific add_<ClassName> method register whatever the object refers to.
# Does nothing and returns nil when the object is already registered; this also ends
# the recursion for objects that refer to each other.
def add_object(object)
  return if @objects[object.object_id]
  @objects[object.object_id] = object
  add_object(object.layout[:names])
  # only the last part of the (possibly namespaced) class name selects the method
  clazz = object.class.name.split("::").last
  send("add_#{clazz}".to_sym , object)
end
# Register every element of the array.
def add_Array( array )
  # also array has constant overhead, the padded helper fixes it to multiple of 8
  array.each { |member| add_object(member) }
end
# Register the keys and the values of the hash (in that order).
# NOTE(review): assemble_Hash writes hash.layout[:keys] / hash.layout[:values]; confirm these
# are the very same array objects as the ones registered here.
def add_Hash( hash )
  key_list = hash.keys
  add_object(key_list)
  value_list = hash.values
  add_object(value_list)
end
# Register the classes and the objects of the space (in that order).
def add_BootSpace(space)
  class_table = space.classes
  add_object(class_table)
  object_table = space.objects
  add_object(object_table)
end
# Register name, super class name and instance methods of the class (in that order).
def add_BootClass(clazz)
  class_name = clazz.name
  add_object(class_name)
  parent_name = clazz.super_class_name
  add_object(parent_name)
  method_list = clazz.instance_methods
  add_object(method_list)
end
# Hooks that add_object dispatches to for these classes. They register nothing beyond
# what add_object itself already did (the object and its layout names).
def add_CompiledMethod(method); end

def add_String(str); end

def add_Symbol(sym); end

def add_StringConstant(sc); end
2014-08-29 20:00:25 +02:00
private
2014-09-06 22:03:33 +02:00
# write means we write the resulting address straight into the assembler stream (ie don't return it)
# object means the object of which we write the address
# and we write the address into the self, given as second parameter (currently not used by the code)
# Raises RuntimeError when the object was never linked (not registered in @objects).
def write_ref_for(object , self_ref)
  # same check as in assemble_self; the original tested an undefined local and always raised NameError
  raise "Object (#{object.object_id}) not linked #{object.inspect}" unless @objects[object.object_id]
  @stream.write_sint32 object.position
end
# Objects only come in lengths that are a multiple of 8 words (32 bytes),
# but there is a constant overhead of 2 words, one for type, one for layout.
# As we would have to subtract 1 to make it work without overhead, we now have to add 7.
# len:: length of the object's content without the overhead (bytes, going by padded_words and pad_after)
# Returns the padded total length, always a multiple of 32.
def padded(len)
  32 * (1 + (len + 7) / 32)
end
# Same as padded, but for a length given in words instead of bytes.
def padded_words(words)
  byte_length = words * 4 # 4 == word length, a constant waiting for a home
  padded(byte_length)
end
# pad_after is always in bytes and pads (writes 0's) up to the next 8 word boundary
# length:: number of content bytes already written for the object, not counting the header
# Returns the number of zero bytes written.
def pad_after(length)
  pad = padded(length) - length - 8 # for header, type and layout
  pad.times do
    @stream.write_uint8(0)
  end
end
end
2014-08-26 10:50:43 +02:00
# NOTE(review): presumably registers :objects as a volatile attribute of Register::Assembler so that
# Sof leaves it out when writing an Assembler — confirm against Sof::Volotile.
Sof::Volotile.add(Register::Assembler , [:objects])
end