kronos/gist:293163

## gistfile1.diff
From 70bbac4dbbb7eca14b73557d9ea32fb8f6df58e5 Mon Sep 17 00:00:00 2001
From: Ivan Samsonov <hronya@gmail.com>
Date: Wed, 3 Feb 2010 02:23:51 +0300
Subject: [PATCH] Speed up Array#pack
 Implement 'w' directive for String#unpack
 Speed up String#rpartition

---
 kernel/common/pack.rb                      |  425 ++++++++++++++--------------
 kernel/common/string.rb                    |   39 ++-
 spec/tags/ruby/core/string/unpack_tags.txt |    2 -
 3 files changed, 240 insertions(+), 226 deletions(-)
 delete mode 100644 spec/tags/ruby/core/string/unpack_tags.txt

diff --git a/kernel/common/pack.rb b/kernel/common/pack.rb
index e87fd09..1102856 100644
--- a/kernel/common/pack.rb
+++ b/kernel/common/pack.rb
@@ -7,7 +7,7 @@ class Array::Packer
   BASE_64_B2A[63] = '/'

   POINTER_SIZE = Rubinius::L64 ? 8 : 4
-  def initialize(array,schema)
+  def initialize(array, schema)
     @source = array
     @schema = schema
     @index = 0
@@ -19,78 +19,106 @@ class Array::Packer
     @ptr ||= FFI::MemoryPointer.new(16) # enough for all uses
   end

-  def parse(schema)
-    # The schema is an array of arrays like [["A", "6"], ["u", "*"],
-    # ["X", ""]]. It represents the parsed form of "A6u*X".  Remove
-    # strings in the schema between # and \n
-    schema = schema.gsub(/#.*/, '')
-    schema.scan(/([^\s\d!_\*])([\d!_\*]*)/)
-  end
-
   def dispatch
-    parse(@schema).each do |kind, t|
-      t = nil if t.empty?
+    schema = @schema.gsub(/#.*/, '')
+    i = 0
+    length = schema.length
+    native_size = false

-      case kind # TODO: switch kind to ints
-      when 'X'
-        size = (t || 1).to_i
-        raise ArgumentError, "you're backing up too far" if size > @result.size
-        @result.shorten!(size) if size > 0
-      when 'x'
-        size = (t || 1).to_i
-        @result << "\000" * size
-      when 'a', 'A', 'Z'
-        ascii_string(kind, t)
-      when 'b', 'B'
-        bit_string(kind, t)
-      when 'c', 'C'
-        character(kind, t)
-      when 'M'
+    while i < length do
+      kind = schema[i]
+      i += 1
+
+      next if kind.isspace
+
+      if schema[i] == ?_ or schema[i] == ?!
+        if kind == ?s or kind == ?S or kind == ?i or kind == ?I or kind == ?l or kind == ?L
+          i += 1
+          native_size = true
+        else
+          raise ArgumentError, "#{schema[i]} allowed only after types sSiIlL"
+        end
+      end
+
+      if i == length
+        len = 1
+      elsif schema[i].isdigit
+        len = 0
+        begin
+          len = len * 10 + schema[i] - ?0
+          i += 1
+        end while i < length and schema[i].isdigit
+      elsif schema[i] == ?*
+        len = case kind
+              when ?@, ?X, ?x, ?u
+                0
+              when ?P, ?M, ?m
+                1
+              when ?u, ?m, ?H, ?h, ?B, ?b, ?A, ?a, ?Z
+                nil  # size depends on item
+              else
+                @source.size - @index
+              end
+        i += 1
+      else
+        len = 1
+      end
+      case kind
+      when ?X
+        raise ArgumentError, "you're backing up too far" if len > @result.size
+        @result.shorten!(len) if len > 0
+      when ?x
+        @result << "\000" * len
+      when ?a, ?A, ?Z
+        ascii_string(kind, len)
+      when ?b, ?B
+        bit_string(kind, len)
+      when ?c, ?C
+        character(kind, len)
+      when ?M
         # for some reason MRI responds to to_s here
         item = Type.coerce_to(fetch_item(), String, :to_s)
-        line_length = 72
-        if t && t =~ /^\d/ && t.to_i >= 3
-          line_length = t.to_i
+        if len >= 3
+          line_length = len
+        else
+          line_length = 72
         end
         line_length += 1 # bug compatibility with MRI

         @result << item.scan(/.{1,#{line_length}}/m).map { |line|
           line.gsub(/[^ -<>-~\t\n]/) { |m| "=%02X" % m[0] } + "=\n"
         }.join
-      when 'm'
-        @result << encode(kind, t, :base64).join.sub(/(A{1,2})\n\Z/) { "#{'=' * $1.size}\n" }
-      when 'w'
-        ber_compress(kind, t)
-      when 'u'
-        @result << encode(kind, t, :uuencode).join.gsub(/ /, '`')
-      when 'd', 'D', 'e', 'E', 'f', 'F', 'g', 'G'
-        decimal(kind, t)
-      when 'i', 'I', 's', 'S', 'l', 'L', 'v', 'V'
-        integer(kind, t)
-      when 'N'
-        net_long(t)
-      when 'n'
-        net_short(t)
-      when 'p', 'P'
-        pointer(kind, t)
-      when 'Q', 'q'
-        integer64(kind, t)
-      when 'H', 'h'
-        hex_string(kind, t)
-      when 'U'
-        utf_string(kind, t)
-      when '@'
-        pos = if(t.nil?)
-                raise ArgumentError
-              else
-                t.to_i
-              end
-        if(pos < @result.size)
-          @result = @result[0...pos]
-        elsif(pos > @result.size)
+      when ?m
+        @result << encode(kind, len, :base64).join.sub(/(A{1,2})\n\Z/) { "#{'=' * $1.size}\n" }
+      when ?w
+        ber_compress(kind, len)
+      when ?u
+        @result << encode(kind, len, :uuencode).join.gsub(/ /, '`')
+      when ?d, ?D, ?e, ?E, ?f, ?F, ?g, ?G
+        decimal(kind, len)
+      when ?i, ?I, ?s, ?S, ?l, ?L, ?v, ?V
+        integer(kind, len, native_size)
+        native_size = false
+      when ?N
+        net_long(len)
+      when ?n
+        net_short(len)
+      when ?p, ?P
+        pointer(kind, len)
+      when ?Q, ?q
+        integer64(kind, len)
+      when ?H, ?h
+        hex_string(kind, len)
+      when ?U
+        utf_string(kind, len)
+      when ?@
+        pos = len
+        if pos < @result.size
+          @result = @result.substring(0, pos)
+        elsif pos > @result.size
           @result << "\x00" * (pos - @result.size)
         end
-      when '%'
+      when ?%
         raise ArgumentError, "#{kind} not implemented"
       end
     end
@@ -110,63 +138,49 @@ class Array::Packer
     return item
   end

-  def parse_tail(t, kind, remaining = @source.size - @index)
-    if(t != nil && (t.include?('_') || t.include?('!')))
-      unless 'sSiIlL'.include?(kind)
-        raise ArgumentError, "#{t} allowed only after types sSiIlL"
-      end
-      t = t.delete("_!")
-    end
-
-    case t
-    when nil
-      1
-    when '*'
-      remaining
-    else
-      m = t.match(/(\d+)/)
-      m ? m[0].to_i : 1
-    end
-  end
-
   # A, a, Z
-  def ascii_string(kind, t)
+  def ascii_string(kind, size)
     item = fetch_item()
     # MRI nil compatibilty for string functions
-    item = "" if item.nil?
+    item = "" unless item

-    item = Type.coerce_to(item, String, :to_str)
-    size = parse_tail(t, kind, item.size + (kind == "Z" ? 1 : 0))
+    item = StringValue(item)
+    size = item.size + (kind == ?Z ? 1 : 0) unless size

     padsize = size - item.size
-    filler  = kind == "A" ? " " : "\0"
+    filler  = kind == ?A ? " " : "\0"

-    @result << item.split(//).first(size).join
+    @result << item.substring(0, size)
     @result << filler * padsize if padsize > 0
   end

   # B, b
-  def bit_string(kind, t)
+  def bit_string(kind, size)
     item = fetch_item()
     # MRI nil compatibilty for string functions
-    item = "" if item.nil?
+    item = "" unless item

-    item = Type.coerce_to(item, String, :to_str)
+    item = StringValue(item)
     byte = 0
-    lsb  = (kind == "b")
-    size = parse_tail(t, kind, item.size)
+    lsb  = (kind == ?b)
+    size = item.size unless size

-    bits = item.split(//).map { |c| c[0] & 01 }
-    min = [size, item.size].min
+    min = size < item.size ? size : item.size

-    bits.first(min).each_with_index do |bit, i| # TODO: this can be cleaner
-      i &= 07
+    if min > 0
+      i = 0
+      item.each_byte do |bit|
+        bit &= 01
+        j = i & 07
+        byte |= bit << (lsb ? j : 07 - j)

-      byte |= bit << (lsb ? i : 07 - i)
+        if j == 07
+          @result << byte.chr
+          byte = 0
+        end

-      if i == 07
-        @result << byte.chr
-        byte = 0
+        i += 1
+        break if i >= min
       end
     end

@@ -180,48 +194,48 @@ class Array::Packer
   end

   # C, c
-  def character(kind, t)
-    parse_tail(t, kind).times do
+  def character(kind, size)
+    size.times do
       @result << (Type.coerce_to(fetch_item(), Integer, :to_int) & 0xff).chr
     end
   end

   # P, p
-  def pointer(kind, t)
-    count = parse_tail(t, kind, kind == 'p' ? @source.size - @index : 1)
-    raise ArgumentError, "too few array elements" if
-      @index + count > @source.length && kind == 'p'
-
-    count.times do
+  def pointer(kind, size)
+    size.times do
       item = fetch_item()
-      if(item == nil)
-        @result << "\x00"*POINTER_SIZE
+      unless item
+        @result << "\x00" * POINTER_SIZE
       else
-        item = StringValue item
+        item = StringValue(item)
         raise ArgumentError, "not implemented"
       end
     end
   end

   # H, h
-  def hex_string(kind, t)
-    item = Type.coerce_to(fetch_item(), String, :to_str)
+  def hex_string(kind, size)
+    item = StringValue(fetch_item())

     # MRI nil compatibilty for string functions
-    item = "" if item.nil?
-
-    size = parse_tail(t, kind, item.length)
-    str = item[0, size].scan(/..?/)
+    item = "" unless item

-    numbers = if kind == "h"
-                str.map { |b| b.reverse.hex }
-              else
-                str.map { |b| b.        hex }
-              end
+    size = item.length unless size

-    if kind == 'H' && !numbers.empty? && numbers.last < 16
-      numbers[-1] *= 16
+    str = item.substring(0, size)
+    tail = nil
+    if kind == ?h
+      0.step(str.length-2, 2) do |i|
+        @result << "#{item[i+1].chr}#{item[i].chr}".hex.chr
+      end
+    else
+      0.step(str.length-2, 2) do |i|
+        @result << item.substring(i, 2).hex.chr
+      end
     end
+    tail = item.substring(str.length-1, 1).hex.chr if str.length % 2 == 1
+
+    @result << (kind == ?H ? (tail[0]*16).chr : tail) if tail

     diff = size - item.length

@@ -234,57 +248,38 @@ class Array::Packer
         left = diff / 2
       end

-      left.times do
-        numbers << 0
-      end
+      @result << "\000" * left
     end
-
-    @result << numbers.map { |n| n.chr }.join
   end

-  def decimal(kind, t)
-    size = parse_tail(t, kind)
-
+  def decimal(kind, size)
     want_double = case kind
-                  when 'E', 'D', 'd', 'G' then true
-                  when 'e', 'F', 'f', 'g' then false
+                  when ?E, ?D, ?d, ?G then true
+                  when ?e, ?F, ?f, ?g then false
                   end

     little_endian = case kind
-                    when 'e', 'E' then true
-                    when 'g', 'G' then false
+                    when ?e, ?E then true
+                    when ?g, ?G then false
                     else endian?(:little)
                     end

     size.times do
-      item = fetch_item()
-      item = FloatValue item
+      item = FloatValue(fetch_item())
       bytes = item.to_packed(want_double)
       bytes.reverse! if little_endian ^ endian?(:little)
       @result << bytes
     end
   end

-  QUAD_MAX = 2 ** 64
-  MAX = 2 ** Rubinius::WORDSIZE
+  QUAD_MAX = 1 << 64
+  MAX = 1 << Rubinius::WORDSIZE

   # Q, q
-  def integer64(kind, t)
-    size = parse_tail(t, kind)
-
-    bytes = 8
-
-    little_endian = true
-
-    if @index + size > @source.length
-      raise ArgumentError, "too few array elements"
-    end
-
+  def integer64(kind, size)
     size.times do |i|
       val = Type.coerce_to(fetch_item, Integer, :to_int)

-      max_wordsize = 64
-
       if val.abs >= QUAD_MAX
         raise RangeError, "bignum too big to convert into 'unsigned long'"
       end
@@ -295,14 +290,8 @@ class Array::Packer
   end

   # N
-  def net_long(t)
-    size = parse_tail(t, 'N')
-
-    if @index + size > @source.length
-      raise ArgumentError, "too few array elements"
-    end
-
-    size.times do |i|
+  def net_long(size)
+    size.times do
       val = Type.coerce_to(fetch_item, Integer, :to_int)

       # These ranges checks are so stupid. They don't even check the actual
@@ -318,14 +307,8 @@ class Array::Packer
   end

   # n
-  def net_short(t)
-    size = parse_tail(t, 'n')
-
-    if @index + size > @source.length
-      raise ArgumentError, "too few array elements"
-    end
-
-    size.times do |i|
+  def net_short(size)
+    size.times do
       val = Type.coerce_to(fetch_item, Integer, :to_int)

       # These ranges checks are so stupid. They don't even check the actual
@@ -341,58 +324,50 @@ class Array::Packer
   end

   # i, s, l, I, S, L, V, v
-  def integer(kind, t)
-    size = parse_tail(t, kind)
-
-    if(t && (t.include?('_') || t.include?('!')))
+  def integer(kind, size, native_size)
+    if native_size
       # Native sizes
       bytes = case kind
-              when 'L', 'l' then Rubinius::SIZEOF_LONG
-              when 'I', 'i' then Rubinius::SIZEOF_INT
-              when 'S', 's' then Rubinius::SIZEOF_SHORT
+              when ?L, ?l then Rubinius::SIZEOF_LONG
+              when ?I, ?i then Rubinius::SIZEOF_INT
+              when ?S, ?s then Rubinius::SIZEOF_SHORT
               end
     else
       bytes = case kind
-              when 'L', 'l' then 4
-              when 'I', 'i' then 4
-              when 'S', 's' then 2
-              when 'V'      then 4
-              when 'v'      then 2
+              when ?L, ?l, ?I, ?i, ?V then 4
+              when ?S, ?s, ?v         then 2
               end
     end

-    unsigned      = (kind =~ /I|S|L/)
+    unsigned      = kind == ?I or kind == ?S or kind == ?L
     little_endian = case kind
-                    when 'V', 'v' then true
+                    when ?V, ?v then true
                     else endian?(:little)
                     end

-    raise ArgumentError, "too few array elements" if
-      @index + size > @source.length
-
-    size.times do |i|
+    size.times do
       item = Type.coerce_to(fetch_item(), Integer, :to_int)

       if item.abs >= MAX
         raise RangeError, "bignum too big to convert into 'unsigned long'"
       end

-        @result << if little_endian
-                     item += 2 ** (8 * bytes) if item < 0
-                     (0...bytes).map { |b| ((item >> (b * 8)) & 0xFF).chr }
-                   else # ugly
-                     (0...bytes).map {n=(item & 0xFF).chr;item >>= 8; n}.reverse
-                   end.join
+      if little_endian
+        item += 1 << (8 * bytes) if item < 0
+        bytes.times { |b| @result << ((item >> (b * 8)) & 0xFF).chr }
+      else # ugly
+        @result << (0...bytes).map {n=(item & 0xFF).chr;item >>= 8; n}.reverse.join
+      end
     end
   end

   # w
-  def ber_compress(kind, t)
-    parse_tail(t, kind).times do
-      chars = ''
+  def ber_compress(kind, size)
+    size.times do
       item = Type.coerce_to(fetch_item(), Integer, :to_int)
       raise ArgumentError, "can't compress negative numbers" if item < 0

+      chars = ''
       chars << (item & 0x7f)
       while (item >>= 7) > 0 do
         chars << ((item & 0x7f) | 0x80)
@@ -402,12 +377,12 @@ class Array::Packer
   end

   # u, m
-  def encode(kind, t, type = :base64)
-    item = Type.coerce_to(fetch_item(), String, :to_str)
+  def encode(kind, size, type = :base64)
+    item = StringValue(fetch_item())

     line_length = 45
-    if t && t =~ /^\d/ && t.to_i >= 3
-      line_length = t.to_i
+    if size >= 3
+      line_length = size
       line_length -= line_length % 3
     end

@@ -431,7 +406,7 @@ class Array::Packer

       l = "#{encoded.join}\n"
       if(type == :uuencode)
-        (line.size + ?\s).chr+l
+        (line.size + ?\s).chr + l
       else
         l
       end
@@ -439,38 +414,36 @@ class Array::Packer
   end

   # U
-  def utf_string(kind, t)
-    parse_tail(t, kind).times do
+  def utf_string(kind, size)
+    size.times do
       item = Type.coerce_to(fetch_item(), Integer, :to_i)

       raise RangeError, "pack(U): value out of range" if item < 0

       bytes = 0
-      f = [2 ** 7, 2 ** 11, 2 ** 16, 2 ** 21, 2 ** 26, 2 ** 31].find { |n|
+
+      f = [1 << 7, 1 << 11, 1 << 16, 1 << 21, 1 << 26, 1 << 31].find do |n|
         bytes += 1
         item < n
-      }
+      end

-      raise RangeError, "pack(U): value out of range" if f.nil?
+      raise RangeError, "pack(U): value out of range" unless f

       if bytes == 1
         @result << item
-        bytes = 0
-      end
-
-      i = bytes
+      else
+        i = bytes
+        buf = []

-      buf = []
-      if i > 0
         (i-1).times do
-          buf.unshift((item | 0x80) & 0xBF)
+          buf.unshift(((item | 0x80) & 0xBF).chr)
           item >>= 6
         end
         # catch the highest bits - the mask depends on the byte count
-        buf.unshift(item | ((0x3F00 >> bytes)) & 0xFC)
-      end
+        buf.unshift((item | ((0x3F00 >> bytes)) & 0xFC).chr)

-      @result << buf.map { |n| n.chr }.join
+        @result << buf.join
+      end
     end
   end
 end
@@ -632,6 +605,26 @@ class String::Unpacker
     return i
   end

+  def ber_decompress(i, count, elements)
+    count = @length - i if count == '*'
+
+    count.times do
+      n = 0
+      while i < @length do
+        item = @source[i]
+        i += 1
+        n <<= 7
+        n |= item & 0x7f
+        if item & 0x80 == 0
+          elements << n
+          break
+        end
+      end
+    end
+
+    return i
+  end
+
   # Like int, but always does 4 bytes.
   def long(i, count, elements, signed)
     # TODO honor _.
@@ -922,6 +915,8 @@ class String::Unpacker
         i = base64(i, count, elements)
       when 'U'
         i = utf8(i, count, elements)
+      when 'w'
+        i = ber_decompress(i, count, elements)
       when 'X'
         count = length - i if count == '*'

diff --git a/kernel/common/string.rb b/kernel/common/string.rb
index 89205b6..c811f0e 100644
--- a/kernel/common/string.rb
+++ b/kernel/common/string.rb
@@ -1280,17 +1280,38 @@ class String
     return [self, "", ""]
   end

+  # call-seq:
+  #
+  #    str.rpartition(sep)             => [head, sep, tail]
+  #    str.rpartition(regexp)          => [head, match, tail]
+  #
+  # Searches _sep_ or pattern (_regexp_) in the string from the end
+  # of the string, and returns the part before it, the match, and the part
+  # after it.
+  # If it is not found, returns two empty strings and _str_.
+  #
+  #    "hello".rpartition("l")         #=> ["hel", "l", "o"]
+  #    "hello".rpartition("x")         #=> ["", "", "hello"]
+  #    "hello".rpartition(/.l/)        #=> ["he", "ll", "o"]
+  #
   def rpartition(pattern)
-    pattern = Type.coerce_to(pattern, String, :to_str) unless pattern.is_a? Regexp
-    i = rindex(pattern)
-    return ["", "", self] unless i
-
-    if pattern.is_a? Regexp
-      match = Regexp.last_match
-      [match.pre_match, match[0], match.post_match]
+    if pattern.kind_of? Regexp
+      if m = pattern.search_region(self, 0, size, false)
+        [m.pre_match, m[0], m.post_match]
+      end
     else
-      last = i+pattern.length
-      [self[0...i], self[i...last], self[last...length]]
+      pattern = StringValue(pattern)
+      if i = rindex(pattern)
+        post_start = i + pattern.length
+        post_len = size - post_start
+
+        return [self.substring(0, i),
+                pattern.dup,
+                self.substring(post_start, post_len)]
+      end
+
+      # Nothing worked out, this is the default.
+      return ["", "", self]
     end
   end

diff --git a/spec/tags/ruby/core/string/unpack_tags.txt b/spec/tags/ruby/core/string/unpack_tags.txt
deleted file mode 100644
index 37de522..0000000
--- a/spec/tags/ruby/core/string/unpack_tags.txt
+++ /dev/null
@@ -1,2 +0,0 @@
-fails:String#unpack with 'w' directive produces a BER-compressed integer
-fails:String#unpack with 'w' directive produces a BER-compressed integer
--
1.6.1
	From 70bbac4dbbb7eca14b73557d9ea32fb8f6df58e5 Mon Sep 17 00:00:00 2001
	From: Ivan Samsonov <hronya@gmail.com>
	Date: Wed, 3 Feb 2010 02:23:51 +0300
	Subject: [PATCH] Speed up Array#pack
	Implement 'w' directive for String#unpack
	Speed up String#rpartition

	---
	kernel/common/pack.rb \| 425 ++++++++++++++--------------
	kernel/common/string.rb \| 39 ++-
	spec/tags/ruby/core/string/unpack_tags.txt \| 2 -
	3 files changed, 240 insertions(+), 226 deletions(-)
	delete mode 100644 spec/tags/ruby/core/string/unpack_tags.txt

	diff --git a/kernel/common/pack.rb b/kernel/common/pack.rb
	index e87fd09..1102856 100644
	--- a/kernel/common/pack.rb
	+++ b/kernel/common/pack.rb
	@@ -7,7 +7,7 @@ class Array::Packer
	BASE_64_B2A[63] = '/'

	POINTER_SIZE = Rubinius::L64 ? 8 : 4
	- def initialize(array,schema)
	+ def initialize(array, schema)
	@source = array
	@schema = schema
	@index = 0
	@@ -19,78 +19,106 @@ class Array::Packer
	@ptr \|\|= FFI::MemoryPointer.new(16) # enough for all uses
	end

	- def parse(schema)
	- # The schema is an array of arrays like [["A", "6"], ["u", "*"],
	- # ["X", ""]]. It represents the parsed form of "A6u*X". Remove
	- # strings in the schema between # and \n
	- schema = schema.gsub(/#.*/, '')
	- schema.scan(/([^\s\d!_\])([\d!_\]*)/)
	- end
	-
	def dispatch
	- parse(@schema).each do \|kind, t\|
	- t = nil if t.empty?
	+ schema = @schema.gsub(/#.*/, '')
	+ i = 0
	+ length = schema.length
	+ native_size = false

	- case kind # TODO: switch kind to ints
	- when 'X'
	- size = (t \|\| 1).to_i
	- raise ArgumentError, "you're backing up too far" if size > @result.size
	- @result.shorten!(size) if size > 0
	- when 'x'
	- size = (t \|\| 1).to_i
	- @result << "\000" * size
	- when 'a', 'A', 'Z'
	- ascii_string(kind, t)
	- when 'b', 'B'
	- bit_string(kind, t)
	- when 'c', 'C'
	- character(kind, t)
	- when 'M'
	+ while i < length do
	+ kind = schema[i]
	+ i += 1
	+
	+ next if kind.isspace
	+
	+ if schema[i] == ?_ or schema[i] == ?!
	+ if kind == ?s or kind == ?S or kind == ?i or kind == ?I or kind == ?l or kind == ?L
	+ i += 1
	+ native_size = true
	+ else
	+ raise ArgumentError, "#{schema[i]} allowed only after types sSiIlL"
	+ end
	+ end
	+
	+ if i == length
	+ len = 1
	+ elsif schema[i].isdigit
	+ len = 0
	+ begin
	+ len = len * 10 + schema[i] - ?0
	+ i += 1
	+ end while i < length and schema[i].isdigit
	+ elsif schema[i] == ?*
	+ len = case kind
	+ when ?@, ?X, ?x, ?u
	+ 0
	+ when ?P, ?M, ?m
	+ 1
	+ when ?u, ?m, ?H, ?h, ?B, ?b, ?A, ?a, ?Z
	+ nil # size depends on item
	+ else
	+ @source.size - @index
	+ end
	+ i += 1
	+ else
	+ len = 1
	+ end
	+ case kind
	+ when ?X
	+ raise ArgumentError, "you're backing up too far" if len > @result.size
	+ @result.shorten!(len) if len > 0
	+ when ?x
	+ @result << "\000" * len
	+ when ?a, ?A, ?Z
	+ ascii_string(kind, len)
	+ when ?b, ?B
	+ bit_string(kind, len)
	+ when ?c, ?C
	+ character(kind, len)
	+ when ?M
	# for some reason MRI responds to to_s here
	item = Type.coerce_to(fetch_item(), String, :to_s)
	- line_length = 72
	- if t && t =~ /^\d/ && t.to_i >= 3
	- line_length = t.to_i
	+ if len >= 3
	+ line_length = len
	+ else
	+ line_length = 72
	end
	line_length += 1 # bug compatibility with MRI

	@result << item.scan(/.{1,#{line_length}}/m).map { \|line\|
	line.gsub(/[^ -<>-~\t\n]/) { \|m\| "=%02X" % m[0] } + "=\n"
	}.join
	- when 'm'
	- @result << encode(kind, t, :base64).join.sub(/(A{1,2})\n\Z/) { "#{'=' * $1.size}\n" }
	- when 'w'
	- ber_compress(kind, t)
	- when 'u'
	- @result << encode(kind, t, :uuencode).join.gsub(/ /, '`')
	- when 'd', 'D', 'e', 'E', 'f', 'F', 'g', 'G'
	- decimal(kind, t)
	- when 'i', 'I', 's', 'S', 'l', 'L', 'v', 'V'
	- integer(kind, t)
	- when 'N'
	- net_long(t)
	- when 'n'
	- net_short(t)
	- when 'p', 'P'
	- pointer(kind, t)
	- when 'Q', 'q'
	- integer64(kind, t)
	- when 'H', 'h'
	- hex_string(kind, t)
	- when 'U'
	- utf_string(kind, t)
	- when '@'
	- pos = if(t.nil?)
	- raise ArgumentError
	- else
	- t.to_i
	- end
	- if(pos < @result.size)
	- @result = @result[0...pos]
	- elsif(pos > @result.size)
	+ when ?m
	+ @result << encode(kind, len, :base64).join.sub(/(A{1,2})\n\Z/) { "#{'=' * $1.size}\n" }
	+ when ?w
	+ ber_compress(kind, len)
	+ when ?u
	+ @result << encode(kind, len, :uuencode).join.gsub(/ /, '`')
	+ when ?d, ?D, ?e, ?E, ?f, ?F, ?g, ?G
	+ decimal(kind, len)
	+ when ?i, ?I, ?s, ?S, ?l, ?L, ?v, ?V
	+ integer(kind, len, native_size)
	+ native_size = false
	+ when ?N
	+ net_long(len)
	+ when ?n
	+ net_short(len)
	+ when ?p, ?P
	+ pointer(kind, len)
	+ when ?Q, ?q
	+ integer64(kind, len)
	+ when ?H, ?h
	+ hex_string(kind, len)
	+ when ?U
	+ utf_string(kind, len)
	+ when ?@
	+ pos = len
	+ if pos < @result.size
	+ @result = @result.substring(0, pos)
	+ elsif pos > @result.size
	@result << "\x00" * (pos - @result.size)
	end
	- when '%'
	+ when ?%
	raise ArgumentError, "#{kind} not implemented"
	end
	end
	@@ -110,63 +138,49 @@ class Array::Packer
	return item
	end

	- def parse_tail(t, kind, remaining = @source.size - @index)
	- if(t != nil && (t.include?('_') \|\| t.include?('!')))
	- unless 'sSiIlL'.include?(kind)
	- raise ArgumentError, "#{t} allowed only after types sSiIlL"
	- end
	- t = t.delete("_!")
	- end
	-
	- case t
	- when nil
	- 1
	- when '*'
	- remaining
	- else
	- m = t.match(/(\d+)/)
	- m ? m[0].to_i : 1
	- end
	- end
	-
	# A, a, Z
	- def ascii_string(kind, t)
	+ def ascii_string(kind, size)
	item = fetch_item()
	# MRI nil compatibilty for string functions
	- item = "" if item.nil?
	+ item = "" unless item

	- item = Type.coerce_to(item, String, :to_str)
	- size = parse_tail(t, kind, item.size + (kind == "Z" ? 1 : 0))
	+ item = StringValue(item)
	+ size = item.size + (kind == ?Z ? 1 : 0) unless size

	padsize = size - item.size
	- filler = kind == "A" ? " " : "\0"
	+ filler = kind == ?A ? " " : "\0"

	- @result << item.split(//).first(size).join
	+ @result << item.substring(0, size)
	@result << filler * padsize if padsize > 0
	end

	# B, b
	- def bit_string(kind, t)
	+ def bit_string(kind, size)
	item = fetch_item()
	# MRI nil compatibilty for string functions
	- item = "" if item.nil?
	+ item = "" unless item

	- item = Type.coerce_to(item, String, :to_str)
	+ item = StringValue(item)
	byte = 0
	- lsb = (kind == "b")
	- size = parse_tail(t, kind, item.size)
	+ lsb = (kind == ?b)
	+ size = item.size unless size

	- bits = item.split(//).map { \|c\| c[0] & 01 }
	- min = [size, item.size].min
	+ min = size < item.size ? size : item.size

	- bits.first(min).each_with_index do \|bit, i\| # TODO: this can be cleaner
	- i &= 07
	+ if min > 0
	+ i = 0
	+ item.each_byte do \|bit\|
	+ bit &= 01
	+ j = i & 07
	+ byte \|= bit << (lsb ? j : 07 - j)

	- byte \|= bit << (lsb ? i : 07 - i)
	+ if j == 07
	+ @result << byte.chr
	+ byte = 0
	+ end

	- if i == 07
	- @result << byte.chr
	- byte = 0
	+ i += 1
	+ break if i >= min
	end
	end

	@@ -180,48 +194,48 @@ class Array::Packer
	end

	# C, c
	- def character(kind, t)
	- parse_tail(t, kind).times do
	+ def character(kind, size)
	+ size.times do
	@result << (Type.coerce_to(fetch_item(), Integer, :to_int) & 0xff).chr
	end
	end

	# P, p
	- def pointer(kind, t)
	- count = parse_tail(t, kind, kind == 'p' ? @source.size - @index : 1)
	- raise ArgumentError, "too few array elements" if
	- @index + count > @source.length && kind == 'p'
	-
	- count.times do
	+ def pointer(kind, size)
	+ size.times do
	item = fetch_item()
	- if(item == nil)
	- @result << "\x00"*POINTER_SIZE
	+ unless item
	+ @result << "\x00" * POINTER_SIZE
	else
	- item = StringValue item
	+ item = StringValue(item)
	raise ArgumentError, "not implemented"
	end
	end
	end

	# H, h
	- def hex_string(kind, t)
	- item = Type.coerce_to(fetch_item(), String, :to_str)
	+ def hex_string(kind, size)
	+ item = StringValue(fetch_item())

	# MRI nil compatibilty for string functions
	- item = "" if item.nil?
	-
	- size = parse_tail(t, kind, item.length)
	- str = item[0, size].scan(/..?/)
	+ item = "" unless item

	- numbers = if kind == "h"
	- str.map { \|b\| b.reverse.hex }
	- else
	- str.map { \|b\| b. hex }
	- end
	+ size = item.length unless size

	- if kind == 'H' && !numbers.empty? && numbers.last < 16
	- numbers[-1] *= 16
	+ str = item.substring(0, size)
	+ tail = nil
	+ if kind == ?h
	+ 0.step(str.length-2, 2) do \|i\|
	+ @result << "#{item[i+1].chr}#{item[i].chr}".hex.chr
	+ end
	+ else
	+ 0.step(str.length-2, 2) do \|i\|
	+ @result << item.substring(i, 2).hex.chr
	+ end
	end
	+ tail = item.substring(str.length-1, 1).hex.chr if str.length % 2 == 1
	+
	+ @result << (kind == ?H ? (tail[0]*16).chr : tail) if tail

	diff = size - item.length

	@@ -234,57 +248,38 @@ class Array::Packer
	left = diff / 2
	end

	- left.times do
	- numbers << 0
	- end
	+ @result << "\000" * left
	end
	-
	- @result << numbers.map { \|n\| n.chr }.join
	end

	- def decimal(kind, t)
	- size = parse_tail(t, kind)
	-
	+ def decimal(kind, size)
	want_double = case kind
	- when 'E', 'D', 'd', 'G' then true
	- when 'e', 'F', 'f', 'g' then false
	+ when ?E, ?D, ?d, ?G then true
	+ when ?e, ?F, ?f, ?g then false
	end

	little_endian = case kind
	- when 'e', 'E' then true
	- when 'g', 'G' then false
	+ when ?e, ?E then true
	+ when ?g, ?G then false
	else endian?(:little)
	end

	size.times do
	- item = fetch_item()
	- item = FloatValue item
	+ item = FloatValue(fetch_item())
	bytes = item.to_packed(want_double)
	bytes.reverse! if little_endian ^ endian?(:little)
	@result << bytes
	end
	end

	- QUAD_MAX = 2 ** 64
	- MAX = 2 ** Rubinius::WORDSIZE
	+ QUAD_MAX = 1 << 64
	+ MAX = 1 << Rubinius::WORDSIZE

	# Q, q
	- def integer64(kind, t)
	- size = parse_tail(t, kind)
	-
	- bytes = 8
	-
	- little_endian = true
	-
	- if @index + size > @source.length
	- raise ArgumentError, "too few array elements"
	- end
	-
	+ def integer64(kind, size)
	size.times do \|i\|
	val = Type.coerce_to(fetch_item, Integer, :to_int)

	- max_wordsize = 64
	-
	if val.abs >= QUAD_MAX
	raise RangeError, "bignum too big to convert into 'unsigned long'"
	end
	@@ -295,14 +290,8 @@ class Array::Packer
	end

	# N
	- def net_long(t)
	- size = parse_tail(t, 'N')
	-
	- if @index + size > @source.length
	- raise ArgumentError, "too few array elements"
	- end
	-
	- size.times do \|i\|
	+ def net_long(size)
	+ size.times do
	val = Type.coerce_to(fetch_item, Integer, :to_int)

	# These ranges checks are so stupid. They don't even check the actual
	@@ -318,14 +307,8 @@ class Array::Packer
	end

	# n
	- def net_short(t)
	- size = parse_tail(t, 'n')
	-
	- if @index + size > @source.length
	- raise ArgumentError, "too few array elements"
	- end
	-
	- size.times do \|i\|
	+ def net_short(size)
	+ size.times do
	val = Type.coerce_to(fetch_item, Integer, :to_int)

	# These ranges checks are so stupid. They don't even check the actual
	@@ -341,58 +324,50 @@ class Array::Packer
	end

	# i, s, l, I, S, L, V, v
	- def integer(kind, t)
	- size = parse_tail(t, kind)
	-
	- if(t && (t.include?('_') \|\| t.include?('!')))
	+ def integer(kind, size, native_size)
	+ if native_size
	# Native sizes
	bytes = case kind
	- when 'L', 'l' then Rubinius::SIZEOF_LONG
	- when 'I', 'i' then Rubinius::SIZEOF_INT
	- when 'S', 's' then Rubinius::SIZEOF_SHORT
	+ when ?L, ?l then Rubinius::SIZEOF_LONG
	+ when ?I, ?i then Rubinius::SIZEOF_INT
	+ when ?S, ?s then Rubinius::SIZEOF_SHORT
	end
	else
	bytes = case kind
	- when 'L', 'l' then 4
	- when 'I', 'i' then 4
	- when 'S', 's' then 2
	- when 'V' then 4
	- when 'v' then 2
	+ when ?L, ?l, ?I, ?i, ?V then 4
	+ when ?S, ?s, ?v then 2
	end
	end

	- unsigned = (kind =~ /I\|S\|L/)
	+ unsigned = kind == ?I or kind == ?S or kind == ?L
	little_endian = case kind
	- when 'V', 'v' then true
	+ when ?V, ?v then true
	else endian?(:little)
	end

	- raise ArgumentError, "too few array elements" if
	- @index + size > @source.length
	-
	- size.times do \|i\|
	+ size.times do
	item = Type.coerce_to(fetch_item(), Integer, :to_int)

	if item.abs >= MAX
	raise RangeError, "bignum too big to convert into 'unsigned long'"
	end

	- @result << if little_endian
	- item += 2 ** (8 * bytes) if item < 0
	- (0...bytes).map { \|b\| ((item >> (b * 8)) & 0xFF).chr }
	- else # ugly
	- (0...bytes).map {n=(item & 0xFF).chr;item >>= 8; n}.reverse
	- end.join
	+ if little_endian
	+ item += 1 << (8 * bytes) if item < 0
	+ bytes.times { \|b\| @result << ((item >> (b * 8)) & 0xFF).chr }
	+ else # ugly
	+ @result << (0...bytes).map {n=(item & 0xFF).chr;item >>= 8; n}.reverse.join
	+ end
	end
	end

	# w
	- def ber_compress(kind, t)
	- parse_tail(t, kind).times do
	- chars = ''
	+ def ber_compress(kind, size)
	+ size.times do
	item = Type.coerce_to(fetch_item(), Integer, :to_int)
	raise ArgumentError, "can't compress negative numbers" if item < 0

	+ chars = ''
	chars << (item & 0x7f)
	while (item >>= 7) > 0 do
	chars << ((item & 0x7f) \| 0x80)
	@@ -402,12 +377,12 @@ class Array::Packer
	end

	# u, m
	- def encode(kind, t, type = :base64)
	- item = Type.coerce_to(fetch_item(), String, :to_str)
	+ def encode(kind, size, type = :base64)
	+ item = StringValue(fetch_item())

	line_length = 45
	- if t && t =~ /^\d/ && t.to_i >= 3
	- line_length = t.to_i
	+ if size >= 3
	+ line_length = size
	line_length -= line_length % 3
	end

	@@ -431,7 +406,7 @@ class Array::Packer

	l = "#{encoded.join}\n"
	if(type == :uuencode)
	- (line.size + ?\s).chr+l
	+ (line.size + ?\s).chr + l
	else
	l
	end
	@@ -439,38 +414,36 @@ class Array::Packer
	end

	# U
	- def utf_string(kind, t)
	- parse_tail(t, kind).times do
	+ def utf_string(kind, size)
	+ size.times do
	item = Type.coerce_to(fetch_item(), Integer, :to_i)

	raise RangeError, "pack(U): value out of range" if item < 0

	bytes = 0
	- f = [2 7, 2 11, 2 16, 2 21, 2 26, 2 31].find { \|n\|
	+
	+ f = [1 << 7, 1 << 11, 1 << 16, 1 << 21, 1 << 26, 1 << 31].find do \|n\|
	bytes += 1
	item < n
	- }
	+ end

	- raise RangeError, "pack(U): value out of range" if f.nil?
	+ raise RangeError, "pack(U): value out of range" unless f

	if bytes == 1
	@result << item
	- bytes = 0
	- end
	-
	- i = bytes
	+ else
	+ i = bytes
	+ buf = []

	- buf = []
	- if i > 0
	(i-1).times do
	- buf.unshift((item \| 0x80) & 0xBF)
	+ buf.unshift(((item \| 0x80) & 0xBF).chr)
	item >>= 6
	end
	# catch the highest bits - the mask depends on the byte count
	- buf.unshift(item \| ((0x3F00 >> bytes)) & 0xFC)
	- end
	+ buf.unshift((item \| ((0x3F00 >> bytes)) & 0xFC).chr)

	- @result << buf.map { \|n\| n.chr }.join
	+ @result << buf.join
	+ end
	end
	end
	end
	@@ -632,6 +605,26 @@ class String::Unpacker
	return i
	end

	+ def ber_decompress(i, count, elements)
	+ count = @length - i if count == '*'
	+
	+ count.times do
	+ n = 0
	+ while i < @length do
	+ item = @source[i]
	+ i += 1
	+ n <<= 7
	+ n \|= item & 0x7f
	+ if item & 0x80 == 0
	+ elements << n
	+ break
	+ end
	+ end
	+ end
	+
	+ return i
	+ end
	+
	# Like int, but always does 4 bytes.
	def long(i, count, elements, signed)
	# TODO honor _.
	@@ -922,6 +915,8 @@ class String::Unpacker
	i = base64(i, count, elements)
	when 'U'
	i = utf8(i, count, elements)
	+ when 'w'
	+ i = ber_decompress(i, count, elements)
	when 'X'
	count = length - i if count == '*'

	diff --git a/kernel/common/string.rb b/kernel/common/string.rb
	index 89205b6..c811f0e 100644
	--- a/kernel/common/string.rb
	+++ b/kernel/common/string.rb
	@@ -1280,17 +1280,38 @@ class String
	return [self, "", ""]
	end

	+ # call-seq:
	+ #
	+ # str.rpartition(sep) => [head, sep, tail]
	+ # str.rpartition(regexp) => [head, match, tail]
	+ #
	+ # Searches _sep_ or pattern (_regexp_) in the string from the end
	+ # of the string, and returns the part before it, the match, and the part
	+ # after it.
	+ # If it is not found, returns two empty strings and _str_.
	+ #
	+ # "hello".rpartition("l") #=> ["hel", "l", "o"]
	+ # "hello".rpartition("x") #=> ["", "", "hello"]
	+ # "hello".rpartition(/.l/) #=> ["he", "ll", "o"]
	+ #
	def rpartition(pattern)
	- pattern = Type.coerce_to(pattern, String, :to_str) unless pattern.is_a? Regexp
	- i = rindex(pattern)
	- return ["", "", self] unless i
	-
	- if pattern.is_a? Regexp
	- match = Regexp.last_match
	- [match.pre_match, match[0], match.post_match]
	+ if pattern.kind_of? Regexp
	+ if m = pattern.search_region(self, 0, size, false)
	+ [m.pre_match, m[0], m.post_match]
	+ end
	else
	- last = i+pattern.length
	- [self[0...i], self[i...last], self[last...length]]
	+ pattern = StringValue(pattern)
	+ if i = rindex(pattern)
	+ post_start = i + pattern.length
	+ post_len = size - post_start
	+
	+ return [self.substring(0, i),
	+ pattern.dup,
	+ self.substring(post_start, post_len)]
	+ end
	+
	+ # Nothing worked out, this is the default.
	+ return ["", "", self]
	end
	end

	diff --git a/spec/tags/ruby/core/string/unpack_tags.txt b/spec/tags/ruby/core/string/unpack_tags.txt
	deleted file mode 100644
	index 37de522..0000000
	--- a/spec/tags/ruby/core/string/unpack_tags.txt
	+++ /dev/null
	@@ -1,2 +0,0 @@
	-fails:String#unpack with 'w' directive produces a BER-compressed integer
	-fails:String#unpack with 'w' directive produces a BER-compressed integer
	--
	1.6.1