rubyx/lib/parfait/word.rb



module Parfait
  # A word is a short sequence of characters
  # Characters are not modeled as objects but as (small) integers
  # The small means two of them have to fit into a machine word, utf16 or similar
  #
  # Words are constant, maybe like js strings, ruby symbols
  # Words are short, but may have spaces

  # Words are objects, that means they carry Type as index 0
  # So all indexes are offset by one in the implementation
  # Object length is measured in non-type cells though

  class Word < Data8
    attr :type, :char_length

    # Number of cells at the start of a Word that hold instance variables.
    def self.type_length
      # cell 0: type , cell 1: char_length
      2
    end
    # Index of the last instance variable cell, ie one less than type_length.
    def self.get_length_index
      cells = type_length
      cells - 1
    end
    # Create a word of the given length.
    # The length starts out as 0 and, for a positive len, the word is then
    # padded to len through set_length with 32 (ascii space) as fill character.
    # For now all non-parfait objects (including String) are kept out of here,
    # Risc provides methods to create Parfait objects from ruby.
    #
    # Raises if len is not an Integer or is negative
    def initialize( len )
      super()
      self.char_length = 0
      unless len.kind_of?(::Integer)
        raise "Must init with int, not #{len.class}"
      end
      if len < 0
        raise "Must init with positive, not #{len}"
      end
      set_length( len , 32 ) if len > 0   # 32 being ascii space
    end


    # Return a new Word of the same length, holding the same characters.
    # Characters are transferred one by one with get_char / set_char.
    def copy
      size = self.length
      duplicate = Word.new( size )
      position = 0
      while position < size
        duplicate.set_char( position , self.get_char(position) )
        position = position + 1
      end
      duplicate
    end

    # Number of characters in the word, as stored in char_length
    def length
      char_length
    end

    # Overwrite every character of the word with the given one.
    # Returns the result of fill_from_with.
    def fill_with( char )
      first_index = 0
      fill_from_with( first_index , char )
    end

    # Set every character from index from up to the end of the word to char.
    # Returns nil (and changes nothing) for a negative from, otherwise the
    # index just past the last position visited, which is from itself when
    # from already lies at or beyond the length.
    def fill_from_with( from , char )
      return if from < 0
      limit = self.length
      position = from
      while position < limit
        set_char( position , char )
        position = position + 1
      end
      position
    end

    # true when the word holds no characters at all
    def empty?
      count = self.length
      count == 0
    end

    # Grow the word to len characters, padding the added positions with
    # fill_char. A word is never shrunk: nothing happens when len is not
    # positive or not larger than the current length.
    #
    # The new length is stored first and then validated by check_length,
    # which raises when it is out of bounds.
    # Returns nil when nothing was done, otherwise the result of fill_from_with
    def set_length(len , fill_char)
      return if len <= 0
      old = char_length
      return if old >= len
      self.char_length = len
      check_length
      # indexes are 0 based, so the first added character sits at index old
      # (starting at old + 1 would leave that one character unfilled)
      fill_from_with( old , fill_char )
    end

    # Set the character at the given index to the given character.
    # The character must be an Integer, otherwise an error is raised.
    # The index is checked and translated by range_correct_index, which
    # raises for indexes that are not integers, negative or out of range.
    # Returns the result of set_internal_byte
    def set_char( at , char )
      unless char.kind_of?(::Integer)
        raise "char not fixnum #{char.class}"
      end
      set_internal_byte( range_correct_index(at) , char )
    end

    # Write one byte into the 4-byte cell that contains byte position index.
    # The cell is index / 4 and the byte within it is index % 4, with byte 0
    # in the lowest 8 bits. A cell that does not hold a Numeric yet is treated
    # as 0. The other three bytes of the cell are preserved.
    #
    # Only the low 8 bits of char are stored, so a value outside 0..255 can
    # not spill into the neighbouring characters of the same cell.
    # Returns char as it was passed in
    def set_internal_byte( index , char )
      word_index = index / 4
      shift = (index % 4) * 8
      was = get_internal_word( word_index )
      was = 0 unless was.is_a?(Numeric)
      # clear the target byte, keep the rest of the (32 bit) cell
      kept = was & (0xFFFFFFFF - (0xFF << shift))
      put = kept + ((char & 0xFF) << shift)
      set_internal_word( word_index , put )
      char
    end

    # Get the character at the given index.
    # The index is checked and translated by range_correct_index, which
    # raises for indexes that are not integers, negative or out of range.
    # The returned "character" is whatever get_internal_byte yields for the
    # translated index
    def get_char( at )
      byte_index = range_correct_index(at)
      get_internal_byte( byte_index )
    end


    # Read one byte out of the 4-byte cell that contains byte position index.
    # The cell is index / 4 and the byte within it is index % 4, with byte 0
    # in the lowest 8 bits. A cell that does not hold a Numeric reads as 0.
    # Returns an Integer in the range 0..255
    def get_internal_byte( index )
      cell = get_internal_word( index / 4 )
      cell = 0 unless cell.is_a?(Numeric)
      (cell >> (8 * (index % 4))) & 0xFF
    end

    # Check a character index and translate it into the byte index that
    # set_char / get_char hand on to the internal byte accessors.
    # Counting from the end with negative indexes is not supported.
    # Raises if at is not an Integer, is negative, or is not below length.
    # NOTE(review): the translation adds a fixed 11. Why exactly 11 is not
    # visible in this file, confirm against the memory layout before changing
    def range_correct_index( at )
      raise "index not integer #{at.class}" unless at.is_a?(::Integer)
      raise "index must be positive , not #{at}" if at < 0
      size = self.length
      raise "index too large #{at} > #{size}" if at >= size
      at + 11
    end

    # Compare the word to another, character by character.
    # Answers false unless the other has the same class and the same length.
    # (The class check is stricter than needed, the same characters in the
    # same order would suffice.)
    # Characters are compared starting from the last index down to 0
    def compare( other )
      return false unless other.class == self.class
      return false unless other.length == self.length
      position = self.length - 1
      while position >= 0
        return false unless self.get_char(position) == other.get_char(position)
        position = position - 1
      end
      true
    end

    # Equality by content: a Word equals a String or another Word when their
    # string forms (see to_string) are equal. Anything else is not equal
    def ==(other)
      if other.is_a?(String)
        return self.to_string == other
      end
      return false unless other.is_a?(Word)
      self.to_string == other.to_string
    end

    # Build a ruby String from the characters of the word.
    # Each character is converted with chr, a nil character shows as "*"
    def to_string
      text = ""
      position = 0
      while position < char_length
        code = get_char(position)
        if code
          text = text + code.chr
        else
          text = text + "*"
        end
        position = position + 1
      end
      text
    end

    # As is_value? was answered with true, rfx creates a basic node with this
    # string: the result of to_s wrapped in single quotes.
    # NOTE(review): this uses to_s, not to_string, confirm to_s gives the
    # characters of the word
    def to_rfx
      quote = "'"
      quote + to_s + quote
    end

    # Hands 4 times the instance_length of the type, plus char_length, to
    # Padding.padded and returns the result.
    # NOTE(review): presumably 4 bytes per instance variable cell plus one
    # byte per character, confirm
    def padded_length
      instance_part = 4 * get_type().instance_length
      Padding.padded( instance_part + char_length )
    end

    private
    # Raises when char_length exceeds 1000 characters, returns nil otherwise
    def check_length
      return unless char_length > 1000
      raise "Length out of bounds #{char_length}"
    end
  end

end
rename string to word 2015-05-13 15:06:38 +02:00

			`module Parfait`
			`# A word is a a short sequence of characters`
			`# Characters are not modeled as objects but as (small) integers`
also giving word it's length still hacked as char per word, but should be easy enough to fix when… 2015-10-26 11:23:52 +01:00			`# The small means two of them have to fit into a machine word, utf16 or similar`
rename string to word 2015-05-13 15:06:38 +02:00			`#`
			`# Words are constant, maybe like js strings, ruby symbols`
			`# Words are short, but may have spaces`
fix word implementation and tests much better, though wasteful implementation breaks a few tests, but ploughing on first 2015-05-15 15:45:36 +02:00
fix docs for rename 2016-02-25 21:03:11 +01:00			`# Words are objects, that means they carry Type as index 0`
rename old layout() new is called get_layout, but keep old around for checking 2015-05-17 13:41:18 +02:00			`# So all indexes are offset by one in the implementation`
rename layout to type this one goes to caleb for pointing it out. Much better word 2016-02-25 20:50:10 +01:00			`# Object length is measured in non-type cells though`
rename old layout() new is called get_layout, but keep old around for checking 2015-05-17 13:41:18 +02:00
add data objects marker class (may change) to be able to check access 2018-03-25 17:22:02 +02:00			`class Word < Data8`
make all instances attr read writers unfortunately the writers have to have self.var = otherwise it is just a local var Also need to make the type explicit for all Protocol included memory_length on the class for now 2018-08-11 18:15:34 +02:00			`attr :type, :char_length`
also giving word it's length still hacked as char per word, but should be easy enough to fix when… 2015-10-26 11:23:52 +01:00
use fake memory fix integer offset bug (which only didn’t cause errors as fixnums are still an order too big and the famous +1 error hit the empty space) 2018-05-28 14:09:59 +02:00			`def self.type_length`
			`2 # 0 type , 1 char_length`
			`end`
finally change List to derive from data object can’t derive from data16 as some lists are longer have to get the delegation to work first 2018-05-28 14:45:29 +02:00			`def self.get_length_index`
			`type_length - 1`
temporary word hack to make it look liked indexed 2015-11-09 22:28:40 +01:00			`end`
basic word functionality and conversion from string 2015-05-14 19:39:12 +02:00			`# initialize with length. For now we try to keep all non-parfait (including String) out`
copy and other improvements for word more tests reveal a bug (fixed) and more docs 2015-05-20 12:50:25 +02:00			`# String will contain spaces for non-zero length`
rename register to risc seems to fit the layer much better as we really have a very reduced instruction set 2017-01-19 08:02:29 +01:00			`# Risc provides methods to create Parfait objects from ruby`
switch to 0 based indexing the world rocked for a moment (and more fixes to follow) also the crumbling of idealism was heard 2018-05-14 10:55:01 +02:00			`def initialize( len )`
fix word implementation and tests much better, though wasteful implementation breaks a few tests, but ploughing on first 2015-05-15 15:45:36 +02:00			`super()`
make all instances attr read writers unfortunately the writers have to have self.var = otherwise it is just a local var Also need to make the type explicit for all Protocol included memory_length on the class for now 2018-08-11 18:15:34 +02:00			`self.char_length = 0`
close #21 Mostly replaced Fixnum with integer also in the rx-file dependency all travis and testing with 2.4+ 2019-02-07 17:24:35 +01:00			`raise "Must init with int, not #{len.class}" unless len.kind_of? ::Integer`
fix word implementation and tests much better, though wasteful implementation breaks a few tests, but ploughing on first 2015-05-15 15:45:36 +02:00			`raise "Must init with positive, not #{len}" if len < 0`
switch to 0 based indexing the world rocked for a moment (and more fixes to follow) also the crumbling of idealism was heard 2018-05-14 10:55:01 +02:00			`set_length( len , 32 ) unless len == 0 #32 being ascii space`
rename layout to type this one goes to caleb for pointing it out. Much better word 2016-02-25 20:50:10 +01:00			`#puts "type #{self.get_type} #{self.object_id.to_s(16)}"`
fix word implementation and tests much better, though wasteful implementation breaks a few tests, but ploughing on first 2015-05-15 15:45:36 +02:00			`end`

removing the fake memory form object just in word and list now 2016-12-29 17:49:03 +01:00
copy and other improvements for word more tests reveal a bug (fixed) and more docs 2015-05-20 12:50:25 +02:00			`# return a copy of self`
			`def copy`
			`cop = Word.new( self.length )`
switch to 0 based indexing the world rocked for a moment (and more fixes to follow) also the crumbling of idealism was heard 2018-05-14 10:55:01 +02:00			`index = 0`
			`while( index < self.length )`
copy and other improvements for word more tests reveal a bug (fixed) and more docs 2015-05-20 12:50:25 +02:00			`cop.set_char(index , self.get_char(index))`
			`index = index + 1`
			`end`
			`cop`
			`end`

			`# return the number of characters`
fix word implementation and tests much better, though wasteful implementation breaks a few tests, but ploughing on first 2015-05-15 15:45:36 +02:00			`def length()`
make all instances attr read writers unfortunately the writers have to have self.var = otherwise it is just a local var Also need to make the type explicit for all Protocol included memory_length on the class for now 2018-08-11 18:15:34 +02:00			`obj_len = char_length`
fix word implementation and tests much better, though wasteful implementation breaks a few tests, but ploughing on first 2015-05-15 15:45:36 +02:00			`return obj_len`
basic word functionality and conversion from string 2015-05-14 19:39:12 +02:00			`end`

get binary code to work 2015-05-28 20:10:27 +02:00			`# make every char equal the given one`
switch to 0 based indexing the world rocked for a moment (and more fixes to follow) also the crumbling of idealism was heard 2018-05-14 10:55:01 +02:00			`def fill_with( char )`
get binary code to work 2015-05-28 20:10:27 +02:00			`fill_from_with(0 , char)`
			`end`

switch to 0 based indexing the world rocked for a moment (and more fixes to follow) also the crumbling of idealism was heard 2018-05-14 10:55:01 +02:00			`def fill_from_with( from , char )`
get binary code to work 2015-05-28 20:10:27 +02:00			`len = self.length()`
switch to 0 based indexing the world rocked for a moment (and more fixes to follow) also the crumbling of idealism was heard 2018-05-14 10:55:01 +02:00			`return if from < 0`
			`while( from < len)`
get binary code to work 2015-05-28 20:10:27 +02:00			`set_char( from , char)`
			`from = from + 1`
			`end`
			`from`
			`end`

copy and other improvements for word more tests reveal a bug (fixed) and more docs 2015-05-20 12:50:25 +02:00			`# true if no characters`
fix word implementation and tests much better, though wasteful implementation breaks a few tests, but ploughing on first 2015-05-15 15:45:36 +02:00			`def empty?`
			`return self.length == 0`
			`end`
basic word functionality and conversion from string 2015-05-14 19:39:12 +02:00
copy and other improvements for word more tests reveal a bug (fixed) and more docs 2015-05-20 12:50:25 +02:00			`# pad the string with the given character to the given length`
			`#`
basic word functionality and conversion from string 2015-05-14 19:39:12 +02:00			`def set_length(len , fill_char)`
final word fix that does the parfait 2015-05-17 14:34:45 +02:00			`return if len <= 0`
make all instances attr read writers unfortunately the writers have to have self.var = otherwise it is just a local var Also need to make the type explicit for all Protocol included memory_length on the class for now 2018-08-11 18:15:34 +02:00			`old = char_length`
also giving word it's length still hacked as char per word, but should be easy enough to fix when… 2015-10-26 11:23:52 +01:00			`return if old >= len`
make all instances attr read writers unfortunately the writers have to have self.var = otherwise it is just a local var Also need to make the type explicit for all Protocol included memory_length on the class for now 2018-08-11 18:15:34 +02:00			`self.char_length = len`
also giving word it's length still hacked as char per word, but should be easy enough to fix when… 2015-10-26 11:23:52 +01:00			`check_length`
			`fill_from_with( old + 1 , fill_char )`
basic word functionality and conversion from string 2015-05-14 19:39:12 +02:00			`end`

copy and other improvements for word more tests reveal a bug (fixed) and more docs 2015-05-20 12:50:25 +02:00			`# set the character at the given index to the given character`
			`# character must be an integer, as is the index`
			`# the index starts at one, but may be negative to count from the end`
			`# indexes out of range will raise an error`
add data objects marker class (may change) to be able to check access 2018-03-25 17:22:02 +02:00			`def set_char( at , char )`
close #21 Mostly replaced Fixnum with integer also in the rx-file dependency all travis and testing with 2.4+ 2019-02-07 17:24:35 +01:00			`raise "char not fixnum #{char.class}" unless char.kind_of? ::Integer`
basic word functionality and conversion from string 2015-05-14 19:39:12 +02:00			`index = range_correct_index(at)`
making parfait (both) use the new byte functions 2015-11-19 09:09:24 +01:00			`set_internal_byte( index , char)`
			`end`

add data objects marker class (may change) to be able to check access 2018-03-25 17:22:02 +02:00			`def set_internal_byte( index , char )`
fix both parfait words to have same indexing 2015-11-20 12:25:49 +01:00			`word_index = (index) / 4`
			`rest = ((index) % 4)`
make ruby word byte size was hacked as int interestingly zero change to tests 2015-11-11 18:11:08 +01:00			`shifted = char << (rest * 8)`
rename get/set internal to _word , because _byte versions are coming 2015-11-18 14:36:43 +01:00			`was = get_internal_word( word_index )`
make ruby word byte size was hacked as int interestingly zero change to tests 2015-11-11 18:11:08 +01:00			`was = 0 unless was.is_a?(Numeric)`
implement byte access for some word wouldn’t have been possible without the ruby version 2015-11-11 19:36:07 +01:00			`mask = 0xFF << (rest * 8)`
			`mask = 0xFFFFFFFF - mask`
			`masked = was & mask`
make ruby word byte size was hacked as int interestingly zero change to tests 2015-11-11 18:11:08 +01:00			`put = masked + shifted`
rename get/set internal to _word , because _byte versions are coming 2015-11-18 14:36:43 +01:00			`set_internal_word( word_index , put )`
make ruby word byte size was hacked as int interestingly zero change to tests 2015-11-11 18:11:08 +01:00			`msg = "set index=#{index} word_index=#{word_index} rest=#{rest}= "`
			`msg += "char=#{char.to_s(16)} shifted=#{shifted.to_s(16)} "`
			`msg += "was=#{was.to_s(16)} masked=#{masked.to_s(16)} put=#{put.to_s(16)}"`
			`#puts msg`
			`char`
moving string to parfait using parfait::word also rename builtins string to word 2015-05-13 15:17:10 +02:00			`end`

make ruby word byte size was hacked as int interestingly zero change to tests 2015-11-11 18:11:08 +01:00			`# get the character at the given index (lowest 1)`
copy and other improvements for word more tests reveal a bug (fixed) and more docs 2015-05-20 12:50:25 +02:00			`# the index starts at one, but may be negative to count from the end`
			`# indexes out of range will raise an error`
			`#the return "character" is an integer`
add data objects marker class (may change) to be able to check access 2018-03-25 17:22:02 +02:00			`def get_char( at )`
basic word functionality and conversion from string 2015-05-14 19:39:12 +02:00			`index = range_correct_index(at)`
making parfait (both) use the new byte functions 2015-11-19 09:09:24 +01:00			`get_internal_byte(index)`
			`end`


			`def get_internal_byte( index )`
fix both parfait words to have same indexing 2015-11-20 12:25:49 +01:00			`word_index = (index ) / 4`
			`rest = ((index) % 4)`
rename get/set internal to _word , because _byte versions are coming 2015-11-18 14:36:43 +01:00			`char = get_internal_word(word_index)`
make ruby word byte size was hacked as int interestingly zero change to tests 2015-11-11 18:11:08 +01:00			`char = 0 unless char.is_a?(Numeric)`
			`shifted = char >> (8 * rest)`
			`ret = shifted & 0xFF`
			`msg = "get index=#{index} word_index=#{word_index} rest=#{rest}= "`
			`msg += " char=#{char.to_s(16)} shifted=#{shifted.to_s(16)} ret=#{ret.to_s(16)}"`
			`#puts msg`
			`return ret`
basic word functionality and conversion from string 2015-05-14 19:39:12 +02:00			`end`

switch to 0 based indexing the world rocked for a moment (and more fixes to follow) also the crumbling of idealism was heard 2018-05-14 10:55:01 +02:00			`# private method to account for`
			`def range_correct_index( at )`
basic word functionality and conversion from string 2015-05-14 19:39:12 +02:00			`index = at`
fix both parfait words to have same indexing 2015-11-20 12:25:49 +01:00			`# index = self.length + at if at < 0`
close #21 Mostly replaced Fixnum with integer also in the rx-file dependency all travis and testing with 2.4+ 2019-02-07 17:24:35 +01:00			`raise "index not integer #{at.class}" unless at.is_a?(::Integer)`
switch to 0 based indexing the world rocked for a moment (and more fixes to follow) also the crumbling of idealism was heard 2018-05-14 10:55:01 +02:00			`raise "index must be positive , not #{at}" if (index < 0)`
			`raise "index too large #{at} > #{self.length}" if (index >= self.length )`
fix both parfait words to have same indexing 2015-11-20 12:25:49 +01:00			`return index + 11`
basic word functionality and conversion from string 2015-05-14 19:39:12 +02:00			`end`

copy and other improvements for word more tests reveal a bug (fixed) and more docs 2015-05-20 12:50:25 +02:00			`# compare the word to another`
			`# currently checks for same class, though really identity of the characters`
			`# in right order would suffice`
small word test 2016-12-31 14:17:45 +01:00			`def compare( other )`
fix word implementation and tests much better, though wasteful implementation breaks a few tests, but ploughing on first 2015-05-15 15:45:36 +02:00			`return false if other.class != self.class`
basic word functionality and conversion from string 2015-05-14 19:39:12 +02:00			`return false if other.length != self.length`
switch to 0 based indexing the world rocked for a moment (and more fixes to follow) also the crumbling of idealism was heard 2018-05-14 10:55:01 +02:00			`len = self.length - 1`
			`while(len >= 0)`
basic word functionality and conversion from string 2015-05-14 19:39:12 +02:00			`return false if self.get_char(len) != other.get_char(len)`
			`len = len - 1`
			`end`
			`return true`
			`end`
fix word implementation and tests much better, though wasteful implementation breaks a few tests, but ploughing on first 2015-05-15 15:45:36 +02:00
move parfait adapter into parfait ruby in the future parfait will be coded in some and translated back into ruby to “adapt” until then, all ruby code is the adapter 2015-11-18 10:55:29 +01:00			`def == other`
			`return false unless other.is_a?(String) or other.is_a?(Word)`
			`as_string = self.to_string`
			`unless other.is_a? String`
			`other = other.to_string`
			`end`
			`as_string == other`
			`end`

			`def to_string`
			`string = ""`
switch to 0 based indexing the world rocked for a moment (and more fixes to follow) also the crumbling of idealism was heard 2018-05-14 10:55:01 +02:00			`index = 0`
make all instances attr read writers unfortunately the writers have to have self.var = otherwise it is just a local var Also need to make the type explicit for all Protocol included memory_length on the class for now 2018-08-11 18:15:34 +02:00			`while( index < char_length)`
move parfait adapter into parfait ruby in the future parfait will be coded in some and translated back into ruby to “adapt” until then, all ruby code is the adapter 2015-11-18 10:55:29 +01:00			`char = get_char(index)`
			`string += char ? char.chr : "*"`
			`index = index + 1`
			`end`
			`string`
			`end`

switch to 0 based indexing the world rocked for a moment (and more fixes to follow) also the crumbling of idealism was heard 2018-05-14 10:55:01 +02:00			`# as we answered is_value? with true, rfx will create a basic node with this string`
			`def to_rfx`
fix old tests again 2015-05-24 15:55:03 +02:00			`"'" + to_s + "'"`
using sof is_value 2015-05-15 20:11:29 +02:00			`end`
test compatibility layer test from and to std/parfait objects for list and word for now moved some of that code to virtual, out of parfait 2015-05-18 09:47:29 +02:00
derive binary code form word long ago hacked the binary code to use integers (thus forsaking correct arm binaries) Finally fix by deriving from Word which now has correct binary access Dumped binary.name in the process, that is available from the method 2015-11-14 14:04:04 +01:00			`def padded_length`
make all instances attr read writers unfortunately the writers have to have self.var = otherwise it is just a local var Also need to make the type explicit for all Protocol included memory_length on the class for now 2018-08-11 18:15:34 +02:00			`Padding.padded( 4 * get_type().instance_length + char_length )`
derive binary code form word long ago hacked the binary code to use integers (thus forsaking correct arm binaries) Finally fix by deriving from Word which now has correct binary access Dumped binary.name in the process, that is available from the method 2015-11-14 14:04:04 +01:00			`end`

also giving word it's length still hacked as char per word, but should be easy enough to fix when… 2015-10-26 11:23:52 +01:00			`private`
			`def check_length`
make all instances attr read writers unfortunately the writers have to have self.var = otherwise it is just a local var Also need to make the type explicit for all Protocol included memory_length on the class for now 2018-08-11 18:15:34 +02:00			`raise "Length out of bounds #{char_length}" if char_length > 1000`
also giving word it's length still hacked as char per word, but should be easy enough to fix when… 2015-10-26 11:23:52 +01:00			`end`
rename string to word 2015-05-13 15:06:38 +02:00			`end`
move parfait adapter into parfait ruby in the future parfait will be coded in some and translated back into ruby to “adapt” until then, all ruby code is the adapter 2015-11-18 10:55:29 +01:00
rename string to word 2015-05-13 15:06:38 +02:00			`end`