diff --git a/lib/node.rb b/lib/node.rb
deleted file mode 100644
index 34191b90..00000000
--- a/lib/node.rb
+++ /dev/null
@@ -1,530 +0,0 @@
-require 'strscan'
-
-module XHTML #:nodoc:
-  
-  class Conditions < Hash #:nodoc:
-    def initialize(hash)
-      super()
-      hash = { :content => hash } unless Hash === hash
-      hash = keys_to_symbols(hash)
-      hash.each do |k,v|
-        case k
-          when :tag, :content then
-            # keys are valid, and require no further processing
-          when :attributes then
-            hash[k] = keys_to_strings(v)
-          when :parent, :child, :ancestor, :descendant, :sibling, :before,
-                  :after
-            hash[k] = Conditions.new(v)
-          when :children
-            hash[k] = v = keys_to_symbols(v)
-            v.each do |k,v2|
-              case k
-                when :count, :greater_than, :less_than
-                  # keys are valid, and require no further processing
-                when :only
-                  v[k] = Conditions.new(v2)
-                else
-                  raise "illegal key #{k.inspect} => #{v2.inspect}"
-              end
-            end
-          else
-            raise "illegal key #{k.inspect} => #{v.inspect}"
-        end
-      end
-      update hash
-    end
-
-    private
-
-      def keys_to_strings(hash)
-        hash.keys.inject({}) do |h,k|
-          h[k.to_s] = hash[k]
-          h
-        end
-      end
-
-      def keys_to_symbols(hash)
-        hash.keys.inject({}) do |h,k|
-          raise "illegal key #{k.inspect}" unless k.respond_to?(:to_sym)
-          h[k.to_sym] = hash[k]
-          h
-        end
-      end
-  end
-
-  # The base class of all nodes, textual and otherwise, in an HTML document.
-  class Node #:nodoc:
-    # The array of children of this node. Not all nodes have children.
-    attr_reader :children
-    
-    # The parent node of this node. All nodes have a parent, except for the
-    # root node.
-    attr_reader :parent
-    
-    # The line number of the input where this node was begun
-    attr_reader :line
-    
-    # The byte position in the input where this node was begun
-    attr_reader :position
-    
-    # Create a new node as a child of the given parent.
-    def initialize(parent, line=0, pos=0)
-      @parent = parent
-      @children = []
-      @line, @position = line, pos
-    end
-
-    # Return a textual representation of the node.
-    def to_s
-      s = ""
-      @children.each { |child| s << child.to_s }
-      s
-    end
-
-    # Return false (subclasses must override this to provide specific matching
-    # behavior.) +conditions+ may be of any type.
-    def match(conditions)
-      false
-    end
-
-    # Search the children of this node for the first node for which #find
-    # returns non +nil+. Returns the result of the #find call that succeeded.
-    def find(conditions)
-      conditions = validate_conditions(conditions)
-      @children.each do |child|        
-        node = child.find(conditions)
-        return node if node
-      end
-      nil
-    end
-
-    # Search for all nodes that match the given conditions, and return them
-    # as an array.
-    def find_all(conditions)
-      conditions = validate_conditions(conditions)
-
-      matches = []
-      matches << self if match(conditions)
-      @children.each do |child|
-        matches.concat child.find_all(conditions)
-      end
-      matches
-    end
-
-    # Returns +false+. Subclasses may override this if they define a kind of
-    # tag.
-    def tag?
-      false
-    end
-
-    def validate_conditions(conditions)
-      Conditions === conditions ? conditions : Conditions.new(conditions)
-    end
-
-    def ==(node)
-      return false unless self.class == node.class && children.size == node.children.size
-
-      equivalent = true
-
-      children.size.times do |i|
-        equivalent &&= children[i] == node.children[i]
-      end
-
-      equivalent
-    end
-    
-    class <<self
-      def parse(parent, line, pos, content, strict=true)
-        if content !~ /^<\S/
-          Text.new(parent, line, pos, content)
-        else
-          scanner = StringScanner.new(content)
-
-          unless scanner.skip(/</)
-            if strict
-              raise "expected <"
-            else
-              return Text.new(parent, line, pos, content)
-            end
-          end
-
-          if scanner.skip(/!\[CDATA\[/)
-            scanner.scan_until(/\]\]>/)
-            return CDATA.new(parent, line, pos, scanner.pre_match.gsub(/<!\[CDATA\[/, ''))
-          end
-          
-          closing = ( scanner.scan(/\//) ? :close : nil )
-          return Text.new(parent, line, pos, content) unless name = scanner.scan(/[\w:-]+/)
-          name
-  
-          unless closing
-            scanner.skip(/\s*/)
-            attributes = {}
-            while attr = scanner.scan(/[-\w:]+/)
-              value = true
-              if scanner.scan(/\s*=\s*/)
-                if delim = scanner.scan(/['"]/)
-                  value = ""
-                  while text = scanner.scan(/[^#{delim}\\]+|./)
-                    case text
-                      when "\\" then
-                        value << text
-                        value << scanner.getch
-                      when delim
-                        break
-                      else value << text
-                    end
-                  end
-                else
-                  value = scanner.scan(/[^\s>\/]+/)
-                end
-              end
-              attributes[attr] = value
-              scanner.skip(/\s*/)
-            end
-    
-            closing = ( scanner.scan(/\//) ? :self : nil )
-          end
-          
-          unless scanner.scan(/\s*>/)
-            if strict
-              raise "expected > (got #{scanner.rest.inspect} for #{content}, #{attributes.inspect})" 
-            else
-              # throw away all text until we find what we're looking for
-              scanner.skip_until(/>/) or scanner.terminate
-            end
-          end
-
-          Tag.new(parent, line, pos, name, attributes, closing)
-        end
-      end
-    end
-  end
-
-  # A node that represents text, rather than markup.
-  class Text < Node #:nodoc:
-    
-    attr_reader :content
-    
-    # Creates a new text node as a child of the given parent, with the given
-    # content.
-    def initialize(parent, line, pos, content)
-      super(parent, line, pos)
-      @content = content
-    end
-
-    # Returns the content of this node.
-    def to_s
-      @content
-    end
-
-    # Returns +self+ if this node meets the given conditions. Text nodes support
-    # conditions of the following kinds:
-    #
-    # * if +conditions+ is a string, it must be a substring of the node's
-    #   content
-    # * if +conditions+ is a regular expression, it must match the node's
-    #   content
-    # * if +conditions+ is a hash, it must contain a <tt>:content</tt> key that
-    #   is either a string or a regexp, and which is interpreted as described
-    #   above.
-    def find(conditions)
-      match(conditions) && self
-    end
-    
-    # Returns non-+nil+ if this node meets the given conditions, or +nil+
-    # otherwise. See the discussion of #find for the valid conditions.
-    def match(conditions)
-      case conditions
-        when String
-          @content == conditions
-        when Regexp
-          @content =~ conditions
-        when Hash
-          conditions = validate_conditions(conditions)
-
-          # Text nodes only have :content, :parent, :ancestor
-          unless (conditions.keys - [:content, :parent, :ancestor]).empty?
-            return false
-          end
-
-          match(conditions[:content])
-        else
-          nil
-      end
-    end
-
-    def ==(node)
-      return false unless super
-      content == node.content
-    end
-  end
-  
-  # A CDATA node is simply a text node with a specialized way of displaying
-  # itself.
-  class CDATA < Text #:nodoc:
-    def to_s
-      "<![CDATA[#{super}]>"
-    end
-  end
-
-  # A Tag is any node that represents markup. It may be an opening tag, a
-  # closing tag, or a self-closing tag. It has a name, and may have a hash of
-  # attributes.
-  class Tag < Node #:nodoc:
-    
-    # Either +nil+, <tt>:close</tt>, or <tt>:self</tt>
-    attr_reader :closing
-    
-    # Either +nil+, or a hash of attributes for this node.
-    attr_reader :attributes
-
-    # The name of this tag.
-    attr_reader :name
-        
-    # Create a new node as a child of the given parent, using the given content
-    # to describe the node. It will be parsed and the node name, attributes and
-    # closing status extracted.
-    def initialize(parent, line, pos, name, attributes, closing)
-      super(parent, line, pos)
-      @name = name
-      @attributes = attributes
-      @closing = closing
-    end
-
-    # A convenience for obtaining an attribute of the node. Returns +nil+ if
-    # the node has no attributes.
-    def [](attr)
-      @attributes ? @attributes[attr] : nil
-    end
-
-    # Returns non-+nil+ if this tag can contain child nodes.
-    def childless?(xml = false)
-      return false if xml && @closing.nil?
-      !@closing.nil? ||
-        @name =~ /^(img|br|hr|link|meta|area|base|basefont|
-                    col|frame|input|isindex|param)$/ox
-    end
-
-    # Returns a textual representation of the node
-    def to_s
-      if @closing == :close
-        "</#{@name}>"
-      else
-        s = "<#{@name}"
-        @attributes.each do |k,v|
-          s << " #{k}"
-          s << "=\"#{v}\"" if String === v
-        end
-        s << " /" if @closing == :self
-        s << ">"
-        @children.each { |child| s << child.to_s }
-        s << "</#{@name}>" if @closing != :self && !@children.empty?
-        s
-      end
-    end
-
-    # If either the node or any of its children meet the given conditions, the
-    # matching node is returned. Otherwise, +nil+ is returned. (See the
-    # description of the valid conditions in the +match+ method.)
-    def find(conditions)
-      match(conditions) && self || super
-    end
-
-    # Returns +true+, indicating that this node represents an HTML tag.
-    def tag?
-      true
-    end
-    
-    # Returns +true+ if the node meets any of the given conditions. The
-    # +conditions+ parameter must be a hash of any of the following keys
-    # (all are optional):
-    #
-    # * <tt>:tag</tt>: the node name must match the corresponding value
-    # * <tt>:attributes</tt>: a hash. The node's values must match the
-    #   corresponding values in the hash.
-    # * <tt>:parent</tt>: a hash. The node's parent must match the
-    #   corresponding hash.
-    # * <tt>:child</tt>: a hash. At least one of the node's immediate children
-    #   must meet the criteria described by the hash.
-    # * <tt>:ancestor</tt>: a hash. At least one of the node's ancestors must
-    #   meet the criteria described by the hash.
-    # * <tt>:descendant</tt>: a hash. At least one of the node's descendants
-    #   must meet the criteria described by the hash.
-    # * <tt>:sibling</tt>: a hash. At least one of the node's siblings must
-    #   meet the criteria described by the hash.
-    # * <tt>:after</tt>: a hash. The node must be after any sibling meeting
-    #   the criteria described by the hash, and at least one sibling must match.
-    # * <tt>:before</tt>: a hash. The node must be before any sibling meeting
-    #   the criteria described by the hash, and at least one sibling must match.
-    # * <tt>:children</tt>: a hash, for counting children of a node. Accepts the
-    #   keys:
-    # ** <tt>:count</tt>: either a number or a range which must equal (or
-    #    include) the number of children that match.
-    # ** <tt>:less_than</tt>: the number of matching children must be less than
-    #    this number.
-    # ** <tt>:greater_than</tt>: the number of matching children must be
-    #    greater than this number.
-    # ** <tt>:only</tt>: another hash consisting of the keys to use
-    #    to match on the children, and only matching children will be
-    #    counted.
-    #
-    # Conditions are matched using the following algorithm:
-    #
-    # * if the condition is a string, it must be a substring of the value.
-    # * if the condition is a regexp, it must match the value.
-    # * if the condition is a number, the value must match number.to_s.
-    # * if the condition is +true+, the value must not be +nil+.
-    # * if the condition is +false+ or +nil+, the value must be +nil+.
-    #
-    # Usage:
-    #
-    #   # test if the node is a "span" tag
-    #   node.match :tag => "span"
-    #
-    #   # test if the node's parent is a "div"
-    #   node.match :parent => { :tag => "div" }
-    #
-    #   # test if any of the node's ancestors are "table" tags
-    #   node.match :ancestor => { :tag => "table" }
-    #
-    #   # test if any of the node's immediate children are "em" tags
-    #   node.match :child => { :tag => "em" }
-    #
-    #   # test if any of the node's descendants are "strong" tags
-    #   node.match :descendant => { :tag => "strong" }
-    #
-    #   # test if the node has between 2 and 4 span tags as immediate children
-    #   node.match :children => { :count => 2..4, :only => { :tag => "span" } } 
-    #
-    #   # get funky: test to see if the node is a "div", has a "ul" ancestor
-    #   # and an "li" parent (with "class" = "enum"), and whether or not it has
-    #   # a "span" descendant that contains # text matching /hello world/:
-    #   node.match :tag => "div",
-    #              :ancestor => { :tag => "ul" },
-    #              :parent => { :tag => "li",
-    #                           :attributes => { :class => "enum" } },
-    #              :descendant => { :tag => "span",
-    #                               :child => /hello world/ }
-    def match(conditions)
-      conditions = validate_conditions(conditions)
-      # check content of child nodes
-      if conditions[:content]
-        if children.empty?
-          return false unless match_condition("", conditions[:content])
-        else
-          return false unless children.find { |child| child.match(conditions[:content]) }
-        end
-      end
-
-      # test the name
-      return false unless match_condition(@name, conditions[:tag]) if conditions[:tag]
-
-      # test attributes
-      (conditions[:attributes] || {}).each do |key, value|
-        return false unless match_condition(self[key], value)
-      end
-
-      # test parent
-      return false unless parent.match(conditions[:parent]) if conditions[:parent]
-
-      # test children
-      return false unless children.find { |child| child.match(conditions[:child]) } if conditions[:child]
-   
-      # test ancestors
-      if conditions[:ancestor]
-        return false unless catch :found do
-          p = self
-          throw :found, true if p.match(conditions[:ancestor]) while p = p.parent
-        end
-      end
-
-      # test descendants
-      if conditions[:descendant]
-        return false unless children.find do |child|
-          # test the child
-          child.match(conditions[:descendant]) ||
-          # test the child's descendants
-          child.match(:descendant => conditions[:descendant])
-        end
-      end
-      
-      # count children
-      if opts = conditions[:children]
-        matches = children.select do |c|
-          (c.kind_of?(HTML::Tag) and (c.closing == :self or ! c.childless?))
-        end
-        
-        matches = matches.select { |c| c.match(opts[:only]) } if opts[:only]
-        opts.each do |key, value|
-          next if key == :only
-          case key
-            when :count
-              if Integer === value
-                return false if matches.length != value
-              else
-                return false unless value.include?(matches.length)
-              end
-            when :less_than
-              return false unless matches.length < value
-            when :greater_than
-              return false unless matches.length > value
-            else raise "unknown count condition #{key}"
-          end
-        end
-      end
-
-      # test siblings
-      if conditions[:sibling] || conditions[:before] || conditions[:after]
-        siblings = parent ? parent.children : []
-        self_index = siblings.index(self)
-
-        if conditions[:sibling]
-          return false unless siblings.detect do |s| 
-            s != self && s.match(conditions[:sibling])
-          end
-        end
-
-        if conditions[:before]
-          return false unless siblings[self_index+1..-1].detect do |s| 
-            s != self && s.match(conditions[:before])
-          end
-        end
-
-        if conditions[:after]
-          return false unless siblings[0,self_index].detect do |s| 
-            s != self && s.match(conditions[:after])
-          end
-        end
-      end
-  
-      true
-    end
-
-    def ==(node)
-      return false unless super
-      return false unless closing == node.closing && self.name == node.name
-      attributes == node.attributes
-    end
-    
-    private
-      # Match the given value to the given condition.
-      def match_condition(value, condition)
-        case condition
-          when String
-            value && value == condition
-          when Regexp
-            value && value.match(condition)
-          when Numeric
-            value == condition.to_s
-          when true
-            !value.nil?
-          when false, nil
-            value.nil?
-          else
-            false
-        end
-      end
-  end
-end
diff --git a/lib/sanitize.rb b/lib/sanitize.rb
index 0e9ca32b..69f8e3e7 100644
--- a/lib/sanitize.rb
+++ b/lib/sanitize.rb
@@ -1,207 +1,26 @@
 module Sanitize
 
 # This module provides sanitization of XHTML+MathML+SVG
 # and of inline style attributes.
 #
-# Based heavily on Sam Ruby's code in the Universal FeedParser.
-
-  require 'html/tokenizer'
-  require 'node'
-
-  acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b',
-      'big', 'blockquote', 'br', 'button', 'caption', 'center', 'cite',
-      'code', 'col', 'colgroup', 'dd', 'del', 'dfn', 'dir', 'div', 'dl', 'dt',
-      'em', 'fieldset', 'font', 'form', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6',
-      'hr', 'i', 'img', 'input', 'ins', 'kbd', 'label', 'legend', 'li', 'map',
-      'menu', 'ol', 'optgroup', 'option', 'p', 'pre', 'q', 's', 'samp',
-      'select', 'small', 'span', 'strike', 'strong', 'sub', 'sup', 'table',
-      'tbody', 'td', 'textarea', 'tfoot', 'th', 'thead', 'tr', 'tt', 'u',
-      'ul', 'var']
-      
-  mathml_elements = ['maction', 'math', 'merror', 'mfrac', 'mi',
-      'mmultiscripts', 'mn', 'mo', 'mover', 'mpadded', 'mphantom',
-      'mprescripts', 'mroot', 'mrow', 'mspace', 'msqrt', 'mstyle', 'msub',
-      'msubsup', 'msup', 'mtable', 'mtd', 'mtext', 'mtr', 'munder',
-      'munderover', 'none']
-      
-  svg_elements = ['a', 'animate', 'animateColor', 'animateMotion',
-      'animateTransform', 'circle', 'defs', 'desc', 'ellipse', 'font-face',
-      'font-face-name', 'font-face-src', 'g', 'glyph', 'hkern', 'image',
-      'linearGradient', 'line', 'marker', 'metadata', 'missing-glyph',
-      'mpath', 'path', 'polygon', 'polyline', 'radialGradient', 'rect',
-      'set', 'stop', 'svg', 'switch', 'text', 'title', 'tspan', 'use']
-      
-  acceptable_attributes = ['abbr', 'accept', 'accept-charset', 'accesskey',
-      'action', 'align', 'alt', 'axis', 'border', 'cellpadding',
-      'cellspacing', 'char', 'charoff', 'charset', 'checked', 'cite', 'class',
-      'clear', 'cols', 'colspan', 'color', 'compact', 'coords', 'datetime',
-      'dir', 'disabled', 'enctype', 'for', 'frame', 'headers', 'height',
-      'href', 'hreflang', 'hspace', 'id', 'ismap', 'label', 'lang',
-      'longdesc', 'maxlength', 'media', 'method', 'multiple', 'name',
-      'nohref', 'noshade', 'nowrap', 'prompt', 'readonly', 'rel', 'rev',
-      'rows', 'rowspan', 'rules', 'scope', 'selected', 'shape', 'size',
-      'span', 'src', 'start', 'style', 'summary', 'tabindex', 'target', 'title',
-      'type', 'usemap', 'valign', 'value', 'vspace', 'width', 'xml:lang']
+# Uses the HTML5lib parser, so that the parsing behaviour should
+# resemble that of browsers.
+#
+#  sanitize_xhtml() is a case-sensitive sanitizer, suitable for XHTML.
+#  sanitize_html() is a case-insensitive sanitizer, suitable for HTML.
 
 
-  mathml_attributes = ['actiontype', 'align', 'columnalign', 'columnalign',
-      'columnalign', 'columnlines', 'columnspacing', 'columnspan', 'depth',
-      'display', 'displaystyle', 'equalcolumns', 'equalrows', 'fence',
-      'fontstyle', 'fontweight', 'frame', 'height', 'linethickness', 'lspace',
-      'mathbackground', 'mathcolor', 'mathvariant', 'mathvariant', 'maxsize',
-      'minsize', 'other', 'rowalign', 'rowalign', 'rowalign', 'rowlines',
-      'rowspacing', 'rowspan', 'rspace', 'scriptlevel', 'selection',
-      'separator', 'stretchy', 'width', 'width', 'xlink:href', 'xlink:show',
-      'xlink:type', 'xmlns', 'xmlns:xlink']
+  require 'html5lib/sanitizer'
+  require 'html5lib/html5parser'
+  require 'html5lib/liberalxmlparser'
+  include HTML5lib
 
-      
-  svg_attributes = ['accent-height', 'accumulate', 'additive', 'alphabetic',
-       'arabic-form', 'ascent', 'attributeName', 'attributeType',
-       'baseProfile', 'bbox', 'begin', 'by', 'calcMode', 'cap-height',
-       'class', 'color', 'color-rendering', 'content', 'cx', 'cy', 'd', 'dx',
-       'dy', 'descent', 'display', 'dur', 'end', 'fill', 'fill-rule',
-       'font-family', 'font-size', 'font-stretch', 'font-style', 'font-variant',
-       'font-weight', 'from', 'fx', 'fy', 'g1', 'g2', 'glyph-name', 
-       'gradientUnits', 'hanging', 'height', 'horiz-adv-x', 'horiz-origin-x',
-       'id', 'ideographic', 'k', 'keyPoints', 'keySplines', 'keyTimes',
-       'lang', 'marker-end', 'marker-mid', 'marker-start', 'markerHeight',
-       'markerUnits', 'markerWidth', 'mathematical', 'max', 'min', 'name',
-       'offset', 'opacity', 'orient', 'origin', 'overline-position',
-       'overline-thickness', 'panose-1', 'path', 'pathLength', 'points',
-       'preserveAspectRatio', 'r', 'refX', 'refY', 'repeatCount', 'repeatDur',
-       'requiredExtensions', 'requiredFeatures', 'restart', 'rotate', 'rx',
-       'ry', 'slope', 'stemh', 'stemv', 'stop-color', 'stop-opacity',
-       'strikethrough-position', 'strikethrough-thickness', 'stroke',
-       'stroke-dasharray', 'stroke-dashoffset', 'stroke-linecap',
-       'stroke-linejoin', 'stroke-miterlimit', 'stroke-opacity',
-       'stroke-width', 'systemLanguage', 'target',
-       'text-anchor', 'to', 'transform', 'type', 'u1', 'u2',
-       'underline-position', 'underline-thickness', 'unicode',
-       'unicode-range', 'units-per-em', 'values', 'version', 'viewBox',
-       'visibility', 'width', 'widths', 'x', 'x-height', 'x1', 'x2',
-       'xlink:actuate', 'xlink:arcrole', 'xlink:href', 'xlink:role',
-       'xlink:show', 'xlink:title', 'xlink:type', 'xml:base', 'xml:lang',
-       'xml:space', 'xmlns', 'xmlns:xlink', 'y', 'y1', 'y2', 'zoomAndPan']
+  def sanitize_xhtml(html) # XHTML (case-sensitive): parses +html+ as a fragment with HTMLSanitizer as tokenizer; returns its #to_s
+    XHTMLParser.parseFragment(html, :tokenizer => HTMLSanitizer).to_s
+  end
 
-  attr_val_is_uri = ['href', 'src', 'cite', 'action', 'longdesc', 'xlink:href']
-  
-  acceptable_css_properties = ['azimuth', 'background-color',
-      'border-bottom-color', 'border-collapse', 'border-color',
-      'border-left-color', 'border-right-color', 'border-top-color', 'clear',
-      'color', 'cursor', 'direction', 'display', 'elevation', 'float', 'font',
-      'font-family', 'font-size', 'font-style', 'font-variant', 'font-weight',
-      'height', 'letter-spacing', 'line-height', 'overflow', 'pause',
-      'pause-after', 'pause-before', 'pitch', 'pitch-range', 'richness',
-      'speak', 'speak-header', 'speak-numeral', 'speak-punctuation',
-      'speech-rate', 'stress', 'text-align', 'text-decoration', 'text-indent',
-      'unicode-bidi', 'vertical-align', 'voice-family', 'volume',
-      'white-space', 'width']
+  def sanitize_html(html) # HTML (case-insensitive): parses +html+ as a fragment with HTMLSanitizer as tokenizer; returns its #to_s
+    HTMLParser.parseFragment(html, :tokenizer => HTMLSanitizer).to_s
+  end
 
-  acceptable_css_keywords = ['auto', 'aqua', 'black', 'block', 'blue',
-      'bold', 'both', 'bottom', 'brown', 'center', 'collapse', 'dashed',
-      'dotted', 'fuchsia', 'gray', 'green', '!important', 'italic', 'left',
-      'lime', 'maroon', 'medium', 'none', 'navy', 'normal', 'nowrap', 'olive',
-      'pointer', 'purple', 'red', 'right', 'solid', 'silver', 'teal', 'top',
-      'transparent', 'underline', 'white', 'yellow']
-
-  acceptable_svg_properties = [ 'fill', 'fill-opacity', 'fill-rule',
-      'stroke', 'stroke-width', 'stroke-linecap', 'stroke-linejoin',
-      'stroke-opacity']
-
-  acceptable_protocols = [ 'ed2k', 'ftp', 'http', 'https', 'irc',
-      'mailto', 'news', 'gopher', 'nntp', 'telnet', 'webcal',
-      'xmpp', 'callto', 'feed', 'urn', 'aim', 'rsync', 'tag',
-      'ssh', 'sftp', 'rtsp', 'afs' ]
-
-      ALLOWED_ELEMENTS = acceptable_elements + mathml_elements + svg_elements  unless defined?(ALLOWED_ELEMENTS)
-      ALLOWED_ATTRIBUTES = acceptable_attributes + mathml_attributes + svg_attributes unless defined?(ALLOWED_ATTRIBUTES)
-      ALLOWED_CSS_PROPERTIES = acceptable_css_properties unless defined?(ALLOWED_CSS_PROPERTIES)
-      ALLOWED_CSS_KEYWORDS = acceptable_css_keywords unless defined?(ALLOWED_CSS_KEYWORDS)
-      ALLOWED_SVG_PROPERTIES = acceptable_svg_properties unless defined?(ALLOWED_SVG_PROPERTIES)
-      ALLOWED_PROTOCOLS = acceptable_protocols unless defined?(ALLOWED_PROTOCOLS)
-      ATTR_VAL_IS_URI = attr_val_is_uri unless defined?(ATTR_VAL_IS_URI)
-
-      # Sanitize the +html+, escaping all elements not in ALLOWED_ELEMENTS, and stripping out all
-      # attributes not in ALLOWED_ATTRIBUTES. Style attributes are parsed, and a restricted set,
-      # specified by ALLOWED_CSS_PROPERTIES and ALLOWED_CSS_KEYWORDS, are allowed through.
-      # attributes in ATTR_VAL_IS_URI are scanned, and only URI schemes specified in
-      # ALLOWED_PROTOCOLS are allowed.
-      # You can adjust what gets sanitized, by defining these constant arrays before this Module is loaded. 
-      #
-      #   sanitize_html('<script> do_nasty_stuff() </script>')
-      #    => &lt;script> do_nasty_stuff() &lt;/script>
-      #   sanitize_html('<a href="javascript: sucker();">Click here for $100</a>')
-      #    => <a>Click here for $100</a>
-      def sanitize_xhtml(html)
-        if html.index("<")
-          tokenizer = HTML::Tokenizer.new(html)
-          new_text = ""
-
-          while token = tokenizer.next
-            node = XHTML::Node.parse(nil, 0, 0, token, false)
-            new_text << case node.tag?
-              when true
-                if ALLOWED_ELEMENTS.include?(node.name)
-                  if node.closing != :close
-                    node.attributes.delete_if { |attr,v| !ALLOWED_ATTRIBUTES.include?(attr) }
-                    ATTR_VAL_IS_URI.each do |attr|
-                      val_unescaped = CGI.unescapeHTML(node.attributes[attr].to_s).gsub(/[\000-\040\177\s]+|\302*[\200-\240]/,'').downcase
-                      if val_unescaped =~ /^[a-z0-9][-+.a-z0-9]*:/ and !ALLOWED_PROTOCOLS.include?(val_unescaped.split(':')[0]) 
-                        node.attributes.delete attr 
-                      end
-                    end
-                    if node.attributes['style']
-                      node.attributes['style'] = sanitize_css(node.attributes['style']) 
-                    end
-                  end
-                  node.to_s
-                else
-                  node.to_s.gsub(/</, "&lt;")
-                end
-              else
-                node.to_s.gsub(/</, "&lt;")
-            end
-          end
-
-          html = new_text
-        end
-        html
-      end
-      
-      def sanitize_css(style)
-          # disallow urls
-          style = style.to_s.gsub(/url\s*\(\s*[^\s)]+?\s*\)\s*/, ' ')
-
-          # gauntlet
-          if style !~ /^([:,;#%.\sa-zA-Z0-9!]|\w-\w|\'[\s\w]+\'|\"[\s\w]+\"|\([\d,\s]+\))*$/
-             style = ''
-             return style
-          end
-          if style !~ /^(\s*[-\w]+\s*:\s*[^:;]*(;|$))*$/
-             style = ''
-             return style
-          end
-
-          clean = []
-          style.scan(/([-\w]+)\s*:\s*([^:;]*)/) do |prop,val|
-            if ALLOWED_CSS_PROPERTIES.include?(prop.downcase)
-              clean <<  prop + ': ' + val + ';'
-            elsif ['background','border','margin','padding'].include?(prop.split('-')[0].downcase) 
-              goodval = true
-              val.split().each do |keyword|
-                if !ALLOWED_CSS_KEYWORDS.include?(keyword) and 
-                   keyword !~ /^(#[0-9a-f]+|rgb\(\d+%?,\d*%?,?\d*%?\)?|\d{0,2}\.?\d{0,2}(cm|em|ex|in|mm|pc|pt|px|%|,|\))?)$/
-                  goodval = false
-                end
-              end
-              if goodval 
-                clean <<  prop + ': ' + val + ';'
-              end
-            elsif ALLOWED_SVG_PROPERTIES.include?(prop.downcase)
-               clean <<  prop + ': ' + val + ';'
-            end
-          end
-
-          style = clean.join(' ')
-      end
-end      
+end
diff --git a/vendor/plugins/HTML5lib/Rakefile.rb b/vendor/plugins/HTML5lib/Rakefile.rb
index 36c4692b..90a72824 100644
--- a/vendor/plugins/HTML5lib/Rakefile.rb
+++ b/vendor/plugins/HTML5lib/Rakefile.rb
@@ -2,6 +2,6 @@ require 'rake'
 require 'rake/testtask'
 
 Rake::TestTask.new do |task|
-	task.pattern = 'tests/test_*.rb'
-	task.verbose = true
+  task.pattern = 'tests/test_*.rb'
+  task.verbose = true
 end
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/constants.rb b/vendor/plugins/HTML5lib/lib/html5lib/constants.rb
index 67bc2f96..c0c3dc3f 100755
--- a/vendor/plugins/HTML5lib/lib/html5lib/constants.rb
+++ b/vendor/plugins/HTML5lib/lib/html5lib/constants.rb
@@ -1,676 +1,676 @@
 module HTML5lib
 
-class EOF < Exception; end
+  class EOF < Exception; end
 
-CONTENT_MODEL_FLAGS = [
-    :PCDATA,
-    :RCDATA,
-    :CDATA,
-    :PLAINTEXT
-]
+  CONTENT_MODEL_FLAGS = [
+      :PCDATA,
+      :RCDATA,
+      :CDATA,
+      :PLAINTEXT
+  ]
 
-SCOPING_ELEMENTS = %w[
-    button
-    caption
-    html
-    marquee
-    object
-    table
-    td
-    th
-]
+  SCOPING_ELEMENTS = %w[
+      button
+      caption
+      html
+      marquee
+      object
+      table
+      td
+      th
+  ]
 
-FORMATTING_ELEMENTS = %w[
-    a
-    b
-    big
-    em
-    font
-    i
-    nobr
-    s
-    small
-    strike
-    strong
-    tt
-    u
-]
+  FORMATTING_ELEMENTS = %w[
+      a
+      b
+      big
+      em
+      font
+      i
+      nobr
+      s
+      small
+      strike
+      strong
+      tt
+      u
+  ]
 
-SPECIAL_ELEMENTS = %w[
-    address
-    area
-    base
-    basefont
-    bgsound
-    blockquote
-    body
-    br
-    center
-    col
-    colgroup
-    dd
-    dir
-    div
-    dl
-    dt
-    embed
-    fieldset
-    form
-    frame
-    frameset
-    h1
-    h2
-    h3
-    h4
-    h5
-    h6
-    head
-    hr
-    iframe
-    image
-    img
-    input
-    isindex
-    li
-    link
-    listing
-    menu
-    meta
-    noembed
-    noframes
-    noscript
-    ol
-    optgroup
-    option
-    p
-    param
-    plaintext
-    pre
-    script
-    select
-    spacer
-    style
-    tbody
-    textarea
-    tfoot
-    thead
-    title
-    tr
-    ul
-    wbr
-]
+  SPECIAL_ELEMENTS = %w[
+      address
+      area
+      base
+      basefont
+      bgsound
+      blockquote
+      body
+      br
+      center
+      col
+      colgroup
+      dd
+      dir
+      div
+      dl
+      dt
+      embed
+      fieldset
+      form
+      frame
+      frameset
+      h1
+      h2
+      h3
+      h4
+      h5
+      h6
+      head
+      hr
+      iframe
+      image
+      img
+      input
+      isindex
+      li
+      link
+      listing
+      menu
+      meta
+      noembed
+      noframes
+      noscript
+      ol
+      optgroup
+      option
+      p
+      param
+      plaintext
+      pre
+      script
+      select
+      spacer
+      style
+      tbody
+      textarea
+      tfoot
+      thead
+      title
+      tr
+      ul
+      wbr
+  ]
 
-SPACE_CHARACTERS = %W[
-    \t
-    \n
-    \x0B
-    \x0C
-    \x20
-    \r
-]
+  SPACE_CHARACTERS = %W[
+      \t
+      \n
+      \x0B
+      \x0C
+      \x20
+      \r
+  ]
 
-TABLE_INSERT_MODE_ELEMENTS = %w[
-    table
-    tbody
-    tfoot
-    thead
-    tr
-]
+  TABLE_INSERT_MODE_ELEMENTS = %w[
+      table
+      tbody
+      tfoot
+      thead
+      tr
+  ]
 
-ASCII_LOWERCASE = ('a'..'z').to_a.join('')
-ASCII_UPPERCASE = ('A'..'Z').to_a.join('')
-ASCII_LETTERS = ASCII_LOWERCASE + ASCII_UPPERCASE
-DIGITS = '0'..'9'
-HEX_DIGITS = DIGITS.to_a + ('a'..'f').to_a + ('A'..'F').to_a
+  ASCII_LOWERCASE = ('a'..'z').to_a.join('')
+  ASCII_UPPERCASE = ('A'..'Z').to_a.join('')
+  ASCII_LETTERS = ASCII_LOWERCASE + ASCII_UPPERCASE
+  DIGITS = '0'..'9'
+  HEX_DIGITS = DIGITS.to_a + ('a'..'f').to_a + ('A'..'F').to_a
 
-# Heading elements need to be ordered 
-HEADING_ELEMENTS = %w[
-    h1
-    h2
-    h3
-    h4
-    h5
-    h6
-]
+  # Heading elements need to be ordered 
+  HEADING_ELEMENTS = %w[
+      h1
+      h2
+      h3
+      h4
+      h5
+      h6
+  ]
 
-# XXX What about event-source and command?
-VOID_ELEMENTS = %w[
-    base
-    link
-    meta
-    hr
-    br
-    img
-    embed
-    param
-    area
-    col
-    input
-]
+  # XXX What about event-source and command?
+  VOID_ELEMENTS = %w[
+      base
+      link
+      meta
+      hr
+      br
+      img
+      embed
+      param
+      area
+      col
+      input
+  ]
 
-# entitiesWindows1252 has to be _ordered_ and needs to have an index.
-ENTITIES_WINDOWS1252 = [
-    8364,  # 0x80  0x20AC  EURO SIGN
-    65533, # 0x81          UNDEFINED
-    8218,  # 0x82  0x201A  SINGLE LOW-9 QUOTATION MARK
-    402,   # 0x83  0x0192  LATIN SMALL LETTER F WITH HOOK
-    8222,  # 0x84  0x201E  DOUBLE LOW-9 QUOTATION MARK
-    8230,  # 0x85  0x2026  HORIZONTAL ELLIPSIS
-    8224,  # 0x86  0x2020  DAGGER
-    8225,  # 0x87  0x2021  DOUBLE DAGGER
-    710,   # 0x88  0x02C6  MODIFIER LETTER CIRCUMFLEX ACCENT
-    8240,  # 0x89  0x2030  PER MILLE SIGN
-    352,   # 0x8A  0x0160  LATIN CAPITAL LETTER S WITH CARON
-    8249,  # 0x8B  0x2039  SINGLE LEFT-POINTING ANGLE QUOTATION MARK
-    338,   # 0x8C  0x0152  LATIN CAPITAL LIGATURE OE
-    65533, # 0x8D          UNDEFINED
-    381,   # 0x8E  0x017D  LATIN CAPITAL LETTER Z WITH CARON
-    65533, # 0x8F          UNDEFINED
-    65533, # 0x90          UNDEFINED
-    8216,  # 0x91  0x2018  LEFT SINGLE QUOTATION MARK
-    8217,  # 0x92  0x2019  RIGHT SINGLE QUOTATION MARK
-    8220,  # 0x93  0x201C  LEFT DOUBLE QUOTATION MARK
-    8221,  # 0x94  0x201D  RIGHT DOUBLE QUOTATION MARK
-    8226,  # 0x95  0x2022  BULLET
-    8211,  # 0x96  0x2013  EN DASH
-    8212,  # 0x97  0x2014  EM DASH
-    732,   # 0x98  0x02DC  SMALL TILDE
-    8482,  # 0x99  0x2122  TRADE MARK SIGN
-    353,   # 0x9A  0x0161  LATIN SMALL LETTER S WITH CARON
-    8250,  # 0x9B  0x203A  SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
-    339,   # 0x9C  0x0153  LATIN SMALL LIGATURE OE
-    65533, # 0x9D          UNDEFINED
-    382,   # 0x9E  0x017E  LATIN SMALL LETTER Z WITH CARON
-    376    # 0x9F  0x0178  LATIN CAPITAL LETTER Y WITH DIAERESIS
-]
+  # entitiesWindows1252 has to be _ordered_ and needs to have an index.
+  ENTITIES_WINDOWS1252 = [
+      8364,  # 0x80  0x20AC  EURO SIGN
+      65533, # 0x81          UNDEFINED
+      8218,  # 0x82  0x201A  SINGLE LOW-9 QUOTATION MARK
+      402,   # 0x83  0x0192  LATIN SMALL LETTER F WITH HOOK
+      8222,  # 0x84  0x201E  DOUBLE LOW-9 QUOTATION MARK
+      8230,  # 0x85  0x2026  HORIZONTAL ELLIPSIS
+      8224,  # 0x86  0x2020  DAGGER
+      8225,  # 0x87  0x2021  DOUBLE DAGGER
+      710,   # 0x88  0x02C6  MODIFIER LETTER CIRCUMFLEX ACCENT
+      8240,  # 0x89  0x2030  PER MILLE SIGN
+      352,   # 0x8A  0x0160  LATIN CAPITAL LETTER S WITH CARON
+      8249,  # 0x8B  0x2039  SINGLE LEFT-POINTING ANGLE QUOTATION MARK
+      338,   # 0x8C  0x0152  LATIN CAPITAL LIGATURE OE
+      65533, # 0x8D          UNDEFINED
+      381,   # 0x8E  0x017D  LATIN CAPITAL LETTER Z WITH CARON
+      65533, # 0x8F          UNDEFINED
+      65533, # 0x90          UNDEFINED
+      8216,  # 0x91  0x2018  LEFT SINGLE QUOTATION MARK
+      8217,  # 0x92  0x2019  RIGHT SINGLE QUOTATION MARK
+      8220,  # 0x93  0x201C  LEFT DOUBLE QUOTATION MARK
+      8221,  # 0x94  0x201D  RIGHT DOUBLE QUOTATION MARK
+      8226,  # 0x95  0x2022  BULLET
+      8211,  # 0x96  0x2013  EN DASH
+      8212,  # 0x97  0x2014  EM DASH
+      732,   # 0x98  0x02DC  SMALL TILDE
+      8482,  # 0x99  0x2122  TRADE MARK SIGN
+      353,   # 0x9A  0x0161  LATIN SMALL LETTER S WITH CARON
+      8250,  # 0x9B  0x203A  SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
+      339,   # 0x9C  0x0153  LATIN SMALL LIGATURE OE
+      65533, # 0x9D          UNDEFINED
+      382,   # 0x9E  0x017E  LATIN SMALL LETTER Z WITH CARON
+      376    # 0x9F  0x0178  LATIN CAPITAL LETTER Y WITH DIAERESIS
+  ]
 
-private
+  private
 
-  def self.U n
-    [n].pack('U')
-  end
+    def self.U n
+      [n].pack('U')
+    end
 
-public
+  public
 
-ENTITIES = {
-    "AElig" => U(0xC6),
-    "Aacute" => U(0xC1),
-    "Acirc" => U(0xC2),
-    "Agrave" => U(0xC0),
-    "Alpha" => U(0x0391),
-    "Aring" => U(0xC5),
-    "Atilde" => U(0xC3),
-    "Auml" => U(0xC4),
-    "Beta" => U(0x0392),
-    "Ccedil" => U(0xC7),
-    "Chi" => U(0x03A7),
-    "Dagger" => U(0x2021),
-    "Delta" => U(0x0394),
-    "ETH" => U(0xD0),
-    "Eacute" => U(0xC9),
-    "Ecirc" => U(0xCA),
-    "Egrave" => U(0xC8),
-    "Epsilon" => U(0x0395),
-    "Eta" => U(0x0397),
-    "Euml" => U(0xCB),
-    "Gamma" => U(0x0393),
-    "Iacute" => U(0xCD),
-    "Icirc" => U(0xCE),
-    "Igrave" => U(0xCC),
-    "Iota" => U(0x0399),
-    "Iuml" => U(0xCF),
-    "Kappa" => U(0x039A),
-    "Lambda" => U(0x039B),
-    "Mu" => U(0x039C),
-    "Ntilde" => U(0xD1),
-    "Nu" => U(0x039D),
-    "OElig" => U(0x0152),
-    "Oacute" => U(0xD3),
-    "Ocirc" => U(0xD4),
-    "Ograve" => U(0xD2),
-    "Omega" => U(0x03A9),
-    "Omicron" => U(0x039F),
-    "Oslash" => U(0xD8),
-    "Otilde" => U(0xD5),
-    "Ouml" => U(0xD6),
-    "Phi" => U(0x03A6),
-    "Pi" => U(0x03A0),
-    "Prime" => U(0x2033),
-    "Psi" => U(0x03A8),
-    "Rho" => U(0x03A1),
-    "Scaron" => U(0x0160),
-    "Sigma" => U(0x03A3),
-    "THORN" => U(0xDE),
-    "Tau" => U(0x03A4),
-    "Theta" => U(0x0398),
-    "Uacute" => U(0xDA),
-    "Ucirc" => U(0xDB),
-    "Ugrave" => U(0xD9),
-    "Upsilon" => U(0x03A5),
-    "Uuml" => U(0xDC),
-    "Xi" => U(0x039E),
-    "Yacute" => U(0xDD),
-    "Yuml" => U(0x0178),
-    "Zeta" => U(0x0396),
-    "aacute" => U(0xE1),
-    "acirc" => U(0xE2),
-    "acute" => U(0xB4),
-    "aelig" => U(0xE6),
-    "agrave" => U(0xE0),
-    "alefsym" => U(0x2135),
-    "alpha" => U(0x03B1),
-    "amp" => U(0x26),
-    "AMP" => U(0x26),
-    "and" => U(0x2227),
-    "ang" => U(0x2220),
-    "apos" => U(0x27),
-    "aring" => U(0xE5),
-    "asymp" => U(0x2248),
-    "atilde" => U(0xE3),
-    "auml" => U(0xE4),
-    "bdquo" => U(0x201E),
-    "beta" => U(0x03B2),
-    "brvbar" => U(0xA6),
-    "bull" => U(0x2022),
-    "cap" => U(0x2229),
-    "ccedil" => U(0xE7),
-    "cedil" => U(0xB8),
-    "cent" => U(0xA2),
-    "chi" => U(0x03C7),
-    "circ" => U(0x02C6),
-    "clubs" => U(0x2663),
-    "cong" => U(0x2245),
-    "copy" => U(0xA9),
-    "COPY" => U(0xA9),
-    "crarr" => U(0x21B5),
-    "cup" => U(0x222A),
-    "curren" => U(0xA4),
-    "dArr" => U(0x21D3),
-    "dagger" => U(0x2020),
-    "darr" => U(0x2193),
-    "deg" => U(0xB0),
-    "delta" => U(0x03B4),
-    "diams" => U(0x2666),
-    "divide" => U(0xF7),
-    "eacute" => U(0xE9),
-    "ecirc" => U(0xEA),
-    "egrave" => U(0xE8),
-    "empty" => U(0x2205),
-    "emsp" => U(0x2003),
-    "ensp" => U(0x2002),
-    "epsilon" => U(0x03B5),
-    "equiv" => U(0x2261),
-    "eta" => U(0x03B7),
-    "eth" => U(0xF0),
-    "euml" => U(0xEB),
-    "euro" => U(0x20AC),
-    "exist" => U(0x2203),
-    "fnof" => U(0x0192),
-    "forall" => U(0x2200),
-    "frac12" => U(0xBD),
-    "frac14" => U(0xBC),
-    "frac34" => U(0xBE),
-    "frasl" => U(0x2044),
-    "gamma" => U(0x03B3),
-    "ge" => U(0x2265),
-    "gt" => U(0x3E),
-    "GT" => U(0x3E),
-    "hArr" => U(0x21D4),
-    "harr" => U(0x2194),
-    "hearts" => U(0x2665),
-    "hellip" => U(0x2026),
-    "iacute" => U(0xED),
-    "icirc" => U(0xEE),
-    "iexcl" => U(0xA1),
-    "igrave" => U(0xEC),
-    "image" => U(0x2111),
-    "infin" => U(0x221E),
-    "int" => U(0x222B),
-    "iota" => U(0x03B9),
-    "iquest" => U(0xBF),
-    "isin" => U(0x2208),
-    "iuml" => U(0xEF),
-    "kappa" => U(0x03BA),
-    "lArr" => U(0x21D0),
-    "lambda" => U(0x03BB),
-    "lang" => U(0x2329),
-    "laquo" => U(0xAB),
-    "larr" => U(0x2190),
-    "lceil" => U(0x2308),
-    "ldquo" => U(0x201C),
-    "le" => U(0x2264),
-    "lfloor" => U(0x230A),
-    "lowast" => U(0x2217),
-    "loz" => U(0x25CA),
-    "lrm" => U(0x200E),
-    "lsaquo" => U(0x2039),
-    "lsquo" => U(0x2018),
-    "lt" => U(0x3C),
-    "LT" => U(0x3C),
-    "macr" => U(0xAF),
-    "mdash" => U(0x2014),
-    "micro" => U(0xB5),
-    "middot" => U(0xB7),
-    "minus" => U(0x2212),
-    "mu" => U(0x03BC),
-    "nabla" => U(0x2207),
-    "nbsp" => U(0xA0),
-    "ndash" => U(0x2013),
-    "ne" => U(0x2260),
-    "ni" => U(0x220B),
-    "not" => U(0xAC),
-    "notin" => U(0x2209),
-    "nsub" => U(0x2284),
-    "ntilde" => U(0xF1),
-    "nu" => U(0x03BD),
-    "oacute" => U(0xF3),
-    "ocirc" => U(0xF4),
-    "oelig" => U(0x0153),
-    "ograve" => U(0xF2),
-    "oline" => U(0x203E),
-    "omega" => U(0x03C9),
-    "omicron" => U(0x03BF),
-    "oplus" => U(0x2295),
-    "or" => U(0x2228),
-    "ordf" => U(0xAA),
-    "ordm" => U(0xBA),
-    "oslash" => U(0xF8),
-    "otilde" => U(0xF5),
-    "otimes" => U(0x2297),
-    "ouml" => U(0xF6),
-    "para" => U(0xB6),
-    "part" => U(0x2202),
-    "permil" => U(0x2030),
-    "perp" => U(0x22A5),
-    "phi" => U(0x03C6),
-    "pi" => U(0x03C0),
-    "piv" => U(0x03D6),
-    "plusmn" => U(0xB1),
-    "pound" => U(0xA3),
-    "prime" => U(0x2032),
-    "prod" => U(0x220F),
-    "prop" => U(0x221D),
-    "psi" => U(0x03C8),
-    "quot" => U(0x22),
-    "QUOT" => U(0x22),
-    "rArr" => U(0x21D2),
-    "radic" => U(0x221A),
-    "rang" => U(0x232A),
-    "raquo" => U(0xBB),
-    "rarr" => U(0x2192),
-    "rceil" => U(0x2309),
-    "rdquo" => U(0x201D),
-    "real" => U(0x211C),
-    "reg" => U(0xAE),
-    "REG" => U(0xAE),
-    "rfloor" => U(0x230B),
-    "rho" => U(0x03C1),
-    "rlm" => U(0x200F),
-    "rsaquo" => U(0x203A),
-    "rsquo" => U(0x2019),
-    "sbquo" => U(0x201A),
-    "scaron" => U(0x0161),
-    "sdot" => U(0x22C5),
-    "sect" => U(0xA7),
-    "shy" => U(0xAD),
-    "sigma" => U(0x03C3),
-    "sigmaf" => U(0x03C2),
-    "sim" => U(0x223C),
-    "spades" => U(0x2660),
-    "sub" => U(0x2282),
-    "sube" => U(0x2286),
-    "sum" => U(0x2211),
-    "sup" => U(0x2283),
-    "sup1" => U(0xB9),
-    "sup2" => U(0xB2),
-    "sup3" => U(0xB3),
-    "supe" => U(0x2287),
-    "szlig" => U(0xDF),
-    "tau" => U(0x03C4),
-    "there4" => U(0x2234),
-    "theta" => U(0x03B8),
-    "thetasym" => U(0x03D1),
-    "thinsp" => U(0x2009),
-    "thorn" => U(0xFE),
-    "tilde" => U(0x02DC),
-    "times" => U(0xD7),
-    "trade" => U(0x2122),
-    "uArr" => U(0x21D1),
-    "uacute" => U(0xFA),
-    "uarr" => U(0x2191),
-    "ucirc" => U(0xFB),
-    "ugrave" => U(0xF9),
-    "uml" => U(0xA8),
-    "upsih" => U(0x03D2),
-    "upsilon" => U(0x03C5),
-    "uuml" => U(0xFC),
-    "weierp" => U(0x2118),
-    "xi" => U(0x03BE),
-    "yacute" => U(0xFD),
-    "yen" => U(0xA5),
-    "yuml" => U(0xFF),
-    "zeta" => U(0x03B6),
-    "zwj" => U(0x200D),
-    "zwnj" => U(0x200C)
-}
+  ENTITIES = {
+      "AElig" => U(0xC6),
+      "Aacute" => U(0xC1),
+      "Acirc" => U(0xC2),
+      "Agrave" => U(0xC0),
+      "Alpha" => U(0x0391),
+      "Aring" => U(0xC5),
+      "Atilde" => U(0xC3),
+      "Auml" => U(0xC4),
+      "Beta" => U(0x0392),
+      "Ccedil" => U(0xC7),
+      "Chi" => U(0x03A7),
+      "Dagger" => U(0x2021),
+      "Delta" => U(0x0394),
+      "ETH" => U(0xD0),
+      "Eacute" => U(0xC9),
+      "Ecirc" => U(0xCA),
+      "Egrave" => U(0xC8),
+      "Epsilon" => U(0x0395),
+      "Eta" => U(0x0397),
+      "Euml" => U(0xCB),
+      "Gamma" => U(0x0393),
+      "Iacute" => U(0xCD),
+      "Icirc" => U(0xCE),
+      "Igrave" => U(0xCC),
+      "Iota" => U(0x0399),
+      "Iuml" => U(0xCF),
+      "Kappa" => U(0x039A),
+      "Lambda" => U(0x039B),
+      "Mu" => U(0x039C),
+      "Ntilde" => U(0xD1),
+      "Nu" => U(0x039D),
+      "OElig" => U(0x0152),
+      "Oacute" => U(0xD3),
+      "Ocirc" => U(0xD4),
+      "Ograve" => U(0xD2),
+      "Omega" => U(0x03A9),
+      "Omicron" => U(0x039F),
+      "Oslash" => U(0xD8),
+      "Otilde" => U(0xD5),
+      "Ouml" => U(0xD6),
+      "Phi" => U(0x03A6),
+      "Pi" => U(0x03A0),
+      "Prime" => U(0x2033),
+      "Psi" => U(0x03A8),
+      "Rho" => U(0x03A1),
+      "Scaron" => U(0x0160),
+      "Sigma" => U(0x03A3),
+      "THORN" => U(0xDE),
+      "Tau" => U(0x03A4),
+      "Theta" => U(0x0398),
+      "Uacute" => U(0xDA),
+      "Ucirc" => U(0xDB),
+      "Ugrave" => U(0xD9),
+      "Upsilon" => U(0x03A5),
+      "Uuml" => U(0xDC),
+      "Xi" => U(0x039E),
+      "Yacute" => U(0xDD),
+      "Yuml" => U(0x0178),
+      "Zeta" => U(0x0396),
+      "aacute" => U(0xE1),
+      "acirc" => U(0xE2),
+      "acute" => U(0xB4),
+      "aelig" => U(0xE6),
+      "agrave" => U(0xE0),
+      "alefsym" => U(0x2135),
+      "alpha" => U(0x03B1),
+      "amp" => U(0x26),
+      "AMP" => U(0x26),
+      "and" => U(0x2227),
+      "ang" => U(0x2220),
+      "apos" => U(0x27),
+      "aring" => U(0xE5),
+      "asymp" => U(0x2248),
+      "atilde" => U(0xE3),
+      "auml" => U(0xE4),
+      "bdquo" => U(0x201E),
+      "beta" => U(0x03B2),
+      "brvbar" => U(0xA6),
+      "bull" => U(0x2022),
+      "cap" => U(0x2229),
+      "ccedil" => U(0xE7),
+      "cedil" => U(0xB8),
+      "cent" => U(0xA2),
+      "chi" => U(0x03C7),
+      "circ" => U(0x02C6),
+      "clubs" => U(0x2663),
+      "cong" => U(0x2245),
+      "copy" => U(0xA9),
+      "COPY" => U(0xA9),
+      "crarr" => U(0x21B5),
+      "cup" => U(0x222A),
+      "curren" => U(0xA4),
+      "dArr" => U(0x21D3),
+      "dagger" => U(0x2020),
+      "darr" => U(0x2193),
+      "deg" => U(0xB0),
+      "delta" => U(0x03B4),
+      "diams" => U(0x2666),
+      "divide" => U(0xF7),
+      "eacute" => U(0xE9),
+      "ecirc" => U(0xEA),
+      "egrave" => U(0xE8),
+      "empty" => U(0x2205),
+      "emsp" => U(0x2003),
+      "ensp" => U(0x2002),
+      "epsilon" => U(0x03B5),
+      "equiv" => U(0x2261),
+      "eta" => U(0x03B7),
+      "eth" => U(0xF0),
+      "euml" => U(0xEB),
+      "euro" => U(0x20AC),
+      "exist" => U(0x2203),
+      "fnof" => U(0x0192),
+      "forall" => U(0x2200),
+      "frac12" => U(0xBD),
+      "frac14" => U(0xBC),
+      "frac34" => U(0xBE),
+      "frasl" => U(0x2044),
+      "gamma" => U(0x03B3),
+      "ge" => U(0x2265),
+      "gt" => U(0x3E),
+      "GT" => U(0x3E),
+      "hArr" => U(0x21D4),
+      "harr" => U(0x2194),
+      "hearts" => U(0x2665),
+      "hellip" => U(0x2026),
+      "iacute" => U(0xED),
+      "icirc" => U(0xEE),
+      "iexcl" => U(0xA1),
+      "igrave" => U(0xEC),
+      "image" => U(0x2111),
+      "infin" => U(0x221E),
+      "int" => U(0x222B),
+      "iota" => U(0x03B9),
+      "iquest" => U(0xBF),
+      "isin" => U(0x2208),
+      "iuml" => U(0xEF),
+      "kappa" => U(0x03BA),
+      "lArr" => U(0x21D0),
+      "lambda" => U(0x03BB),
+      "lang" => U(0x2329),
+      "laquo" => U(0xAB),
+      "larr" => U(0x2190),
+      "lceil" => U(0x2308),
+      "ldquo" => U(0x201C),
+      "le" => U(0x2264),
+      "lfloor" => U(0x230A),
+      "lowast" => U(0x2217),
+      "loz" => U(0x25CA),
+      "lrm" => U(0x200E),
+      "lsaquo" => U(0x2039),
+      "lsquo" => U(0x2018),
+      "lt" => U(0x3C),
+      "LT" => U(0x3C),
+      "macr" => U(0xAF),
+      "mdash" => U(0x2014),
+      "micro" => U(0xB5),
+      "middot" => U(0xB7),
+      "minus" => U(0x2212),
+      "mu" => U(0x03BC),
+      "nabla" => U(0x2207),
+      "nbsp" => U(0xA0),
+      "ndash" => U(0x2013),
+      "ne" => U(0x2260),
+      "ni" => U(0x220B),
+      "not" => U(0xAC),
+      "notin" => U(0x2209),
+      "nsub" => U(0x2284),
+      "ntilde" => U(0xF1),
+      "nu" => U(0x03BD),
+      "oacute" => U(0xF3),
+      "ocirc" => U(0xF4),
+      "oelig" => U(0x0153),
+      "ograve" => U(0xF2),
+      "oline" => U(0x203E),
+      "omega" => U(0x03C9),
+      "omicron" => U(0x03BF),
+      "oplus" => U(0x2295),
+      "or" => U(0x2228),
+      "ordf" => U(0xAA),
+      "ordm" => U(0xBA),
+      "oslash" => U(0xF8),
+      "otilde" => U(0xF5),
+      "otimes" => U(0x2297),
+      "ouml" => U(0xF6),
+      "para" => U(0xB6),
+      "part" => U(0x2202),
+      "permil" => U(0x2030),
+      "perp" => U(0x22A5),
+      "phi" => U(0x03C6),
+      "pi" => U(0x03C0),
+      "piv" => U(0x03D6),
+      "plusmn" => U(0xB1),
+      "pound" => U(0xA3),
+      "prime" => U(0x2032),
+      "prod" => U(0x220F),
+      "prop" => U(0x221D),
+      "psi" => U(0x03C8),
+      "quot" => U(0x22),
+      "QUOT" => U(0x22),
+      "rArr" => U(0x21D2),
+      "radic" => U(0x221A),
+      "rang" => U(0x232A),
+      "raquo" => U(0xBB),
+      "rarr" => U(0x2192),
+      "rceil" => U(0x2309),
+      "rdquo" => U(0x201D),
+      "real" => U(0x211C),
+      "reg" => U(0xAE),
+      "REG" => U(0xAE),
+      "rfloor" => U(0x230B),
+      "rho" => U(0x03C1),
+      "rlm" => U(0x200F),
+      "rsaquo" => U(0x203A),
+      "rsquo" => U(0x2019),
+      "sbquo" => U(0x201A),
+      "scaron" => U(0x0161),
+      "sdot" => U(0x22C5),
+      "sect" => U(0xA7),
+      "shy" => U(0xAD),
+      "sigma" => U(0x03C3),
+      "sigmaf" => U(0x03C2),
+      "sim" => U(0x223C),
+      "spades" => U(0x2660),
+      "sub" => U(0x2282),
+      "sube" => U(0x2286),
+      "sum" => U(0x2211),
+      "sup" => U(0x2283),
+      "sup1" => U(0xB9),
+      "sup2" => U(0xB2),
+      "sup3" => U(0xB3),
+      "supe" => U(0x2287),
+      "szlig" => U(0xDF),
+      "tau" => U(0x03C4),
+      "there4" => U(0x2234),
+      "theta" => U(0x03B8),
+      "thetasym" => U(0x03D1),
+      "thinsp" => U(0x2009),
+      "thorn" => U(0xFE),
+      "tilde" => U(0x02DC),
+      "times" => U(0xD7),
+      "trade" => U(0x2122),
+      "uArr" => U(0x21D1),
+      "uacute" => U(0xFA),
+      "uarr" => U(0x2191),
+      "ucirc" => U(0xFB),
+      "ugrave" => U(0xF9),
+      "uml" => U(0xA8),
+      "upsih" => U(0x03D2),
+      "upsilon" => U(0x03C5),
+      "uuml" => U(0xFC),
+      "weierp" => U(0x2118),
+      "xi" => U(0x03BE),
+      "yacute" => U(0xFD),
+      "yen" => U(0xA5),
+      "yuml" => U(0xFF),
+      "zeta" => U(0x03B6),
+      "zwj" => U(0x200D),
+      "zwnj" => U(0x200C)
+  }
 
-ENCODINGS = %w[
-    ansi_x3.4-1968
-    iso-ir-6
-    ansi_x3.4-1986
-    iso_646.irv:1991
-    ascii
-    iso646-us
-    us-ascii
-    us
-    ibm367
-    cp367
-    csascii
-    ks_c_5601-1987
-    korean
-    iso-2022-kr
-    csiso2022kr
-    euc-kr
-    iso-2022-jp
-    csiso2022jp
-    iso-2022-jp-2
-    iso-ir-58
-    chinese
-    csiso58gb231280
-    iso_8859-1:1987
-    iso-ir-100
-    iso_8859-1
-    iso-8859-1
-    latin1
-    l1
-    ibm819
-    cp819
-    csisolatin1
-    iso_8859-2:1987
-    iso-ir-101
-    iso_8859-2
-    iso-8859-2
-    latin2
-    l2
-    csisolatin2
-    iso_8859-3:1988
-    iso-ir-109
-    iso_8859-3
-    iso-8859-3
-    latin3
-    l3
-    csisolatin3
-    iso_8859-4:1988
-    iso-ir-110
-    iso_8859-4
-    iso-8859-4
-    latin4
-    l4
-    csisolatin4
-    iso_8859-6:1987
-    iso-ir-127
-    iso_8859-6
-    iso-8859-6
-    ecma-114
-    asmo-708
-    arabic
-    csisolatinarabic
-    iso_8859-7:1987
-    iso-ir-126
-    iso_8859-7
-    iso-8859-7
-    elot_928
-    ecma-118
-    greek
-    greek8
-    csisolatingreek
-    iso_8859-8:1988
-    iso-ir-138
-    iso_8859-8
-    iso-8859-8
-    hebrew
-    csisolatinhebrew
-    iso_8859-5:1988
-    iso-ir-144
-    iso_8859-5
-    iso-8859-5
-    cyrillic
-    csisolatincyrillic
-    iso_8859-9:1989
-    iso-ir-148
-    iso_8859-9
-    iso-8859-9
-    latin5
-    l5
-    csisolatin5
-    iso-8859-10
-    iso-ir-157
-    l6
-    iso_8859-10:1992
-    csisolatin6
-    latin6
-    hp-roman8
-    roman8
-    r8
-    ibm037
-    cp037
-    csibm037
-    ibm424
-    cp424
-    csibm424
-    ibm437
-    cp437
-    437
-    cspc8codepage437
-    ibm500
-    cp500
-    csibm500
-    ibm775
-    cp775
-    cspc775baltic
-    ibm850
-    cp850
-    850
-    cspc850multilingual
-    ibm852
-    cp852
-    852
-    cspcp852
-    ibm855
-    cp855
-    855
-    csibm855
-    ibm857
-    cp857
-    857
-    csibm857
-    ibm860
-    cp860
-    860
-    csibm860
-    ibm861
-    cp861
-    861
-    cp-is
-    csibm861
-    ibm862
-    cp862
-    862
-    cspc862latinhebrew
-    ibm863
-    cp863
-    863
-    csibm863
-    ibm864
-    cp864
-    csibm864
-    ibm865
-    cp865
-    865
-    csibm865
-    ibm866
-    cp866
-    866
-    csibm866
-    ibm869
-    cp869
-    869
-    cp-gr
-    csibm869
-    ibm1026
-    cp1026
-    csibm1026
-    koi8-r
-    cskoi8r
-    koi8-u
-    big5-hkscs
-    ptcp154
-    csptcp154
-    pt154
-    cp154
-    utf-7
-    utf-16be
-    utf-16le
-    utf-16
-    utf-8
-    iso-8859-13
-    iso-8859-14
-    iso-ir-199
-    iso_8859-14:1998
-    iso_8859-14
-    latin8
-    iso-celtic
-    l8
-    iso-8859-15
-    iso_8859-15
-    iso-8859-16
-    iso-ir-226
-    iso_8859-16:2001
-    iso_8859-16
-    latin10
-    l10
-    gbk
-    cp936
-    ms936
-    gb18030
-    shift_jis
-    ms_kanji
-    csshiftjis
-    euc-jp
-    gb2312
-    big5
-    csbig5
-    windows-1250
-    windows-1251
-    windows-1252
-    windows-1253
-    windows-1254
-    windows-1255
-    windows-1256
-    windows-1257
-    windows-1258
-    tis-620
-    hz-gb-2312
-]
+  ENCODINGS = %w[
+      ansi_x3.4-1968
+      iso-ir-6
+      ansi_x3.4-1986
+      iso_646.irv:1991
+      ascii
+      iso646-us
+      us-ascii
+      us
+      ibm367
+      cp367
+      csascii
+      ks_c_5601-1987
+      korean
+      iso-2022-kr
+      csiso2022kr
+      euc-kr
+      iso-2022-jp
+      csiso2022jp
+      iso-2022-jp-2
+      iso-ir-58
+      chinese
+      csiso58gb231280
+      iso_8859-1:1987
+      iso-ir-100
+      iso_8859-1
+      iso-8859-1
+      latin1
+      l1
+      ibm819
+      cp819
+      csisolatin1
+      iso_8859-2:1987
+      iso-ir-101
+      iso_8859-2
+      iso-8859-2
+      latin2
+      l2
+      csisolatin2
+      iso_8859-3:1988
+      iso-ir-109
+      iso_8859-3
+      iso-8859-3
+      latin3
+      l3
+      csisolatin3
+      iso_8859-4:1988
+      iso-ir-110
+      iso_8859-4
+      iso-8859-4
+      latin4
+      l4
+      csisolatin4
+      iso_8859-6:1987
+      iso-ir-127
+      iso_8859-6
+      iso-8859-6
+      ecma-114
+      asmo-708
+      arabic
+      csisolatinarabic
+      iso_8859-7:1987
+      iso-ir-126
+      iso_8859-7
+      iso-8859-7
+      elot_928
+      ecma-118
+      greek
+      greek8
+      csisolatingreek
+      iso_8859-8:1988
+      iso-ir-138
+      iso_8859-8
+      iso-8859-8
+      hebrew
+      csisolatinhebrew
+      iso_8859-5:1988
+      iso-ir-144
+      iso_8859-5
+      iso-8859-5
+      cyrillic
+      csisolatincyrillic
+      iso_8859-9:1989
+      iso-ir-148
+      iso_8859-9
+      iso-8859-9
+      latin5
+      l5
+      csisolatin5
+      iso-8859-10
+      iso-ir-157
+      l6
+      iso_8859-10:1992
+      csisolatin6
+      latin6
+      hp-roman8
+      roman8
+      r8
+      ibm037
+      cp037
+      csibm037
+      ibm424
+      cp424
+      csibm424
+      ibm437
+      cp437
+      437
+      cspc8codepage437
+      ibm500
+      cp500
+      csibm500
+      ibm775
+      cp775
+      cspc775baltic
+      ibm850
+      cp850
+      850
+      cspc850multilingual
+      ibm852
+      cp852
+      852
+      cspcp852
+      ibm855
+      cp855
+      855
+      csibm855
+      ibm857
+      cp857
+      857
+      csibm857
+      ibm860
+      cp860
+      860
+      csibm860
+      ibm861
+      cp861
+      861
+      cp-is
+      csibm861
+      ibm862
+      cp862
+      862
+      cspc862latinhebrew
+      ibm863
+      cp863
+      863
+      csibm863
+      ibm864
+      cp864
+      csibm864
+      ibm865
+      cp865
+      865
+      csibm865
+      ibm866
+      cp866
+      866
+      csibm866
+      ibm869
+      cp869
+      869
+      cp-gr
+      csibm869
+      ibm1026
+      cp1026
+      csibm1026
+      koi8-r
+      cskoi8r
+      koi8-u
+      big5-hkscs
+      ptcp154
+      csptcp154
+      pt154
+      cp154
+      utf-7
+      utf-16be
+      utf-16le
+      utf-16
+      utf-8
+      iso-8859-13
+      iso-8859-14
+      iso-ir-199
+      iso_8859-14:1998
+      iso_8859-14
+      latin8
+      iso-celtic
+      l8
+      iso-8859-15
+      iso_8859-15
+      iso-8859-16
+      iso-ir-226
+      iso_8859-16:2001
+      iso_8859-16
+      latin10
+      l10
+      gbk
+      cp936
+      ms936
+      gb18030
+      shift_jis
+      ms_kanji
+      csshiftjis
+      euc-jp
+      gb2312
+      big5
+      csbig5
+      windows-1250
+      windows-1251
+      windows-1252
+      windows-1253
+      windows-1254
+      windows-1255
+      windows-1256
+      windows-1257
+      windows-1258
+      tis-620
+      hz-gb-2312
+  ]
 
 end
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser.rb
index abbb89a6..178ed574 100644
--- a/vendor/plugins/HTML5lib/lib/html5lib/html5parser.rb
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser.rb
@@ -2,141 +2,131 @@ require 'html5lib/constants'
 require 'html5lib/tokenizer'
 require 'html5lib/treebuilders/rexml'
 
+Dir.glob(File.join(File.dirname(__FILE__), 'html5parser', '*_phase.rb')).each do |path|
+  require 'html5lib/html5parser/' + File.basename(path)
+end
+
 module HTML5lib
 
-# HTML parser. Generates a tree structure from a stream of (possibly
-# malformed) HTML
-class HTMLParser
+  # Error in parsed document
+  class ParseError < Exception; end
+  class AssertionError < Exception; end
+
+  # HTML parser. Generates a tree structure from a stream of (possibly malformed) HTML
+  #
+  class HTMLParser
 
     attr_accessor :phase, :firstStartTag, :innerHTML, :lastPhase, :insertFromTable
 
     attr_reader :phases, :tokenizer, :tree, :errors
 
-    # convenience methods
     def self.parse(stream, options = {})
-        encoding = options.delete(:encoding)
-        new(options).parse(stream,encoding)
+      encoding = options.delete(:encoding)
+      new(options).parse(stream,encoding)
     end
 
     def self.parseFragment(stream, options = {})
-        container = options.delete(:container) || 'div'
-        encoding = options.delete(:encoding)
-        new(options).parseFragment(stream,container,encoding)
+      container = options.delete(:container) || 'div'
+      encoding = options.delete(:encoding)
+      new(options).parseFragment(stream,container,encoding)
     end
 
-    @@phases = [
-        :initial,
-        :rootElement,
-        :beforeHead,
-        :inHead,
-        :afterHead,
-        :inBody,
-        :inTable,
-        :inCaption,
-        :inColumnGroup,
-        :inTableBody,
-        :inRow,
-        :inCell,
-        :inSelect,
-        :afterBody,
-        :inFrameset,
-        :afterFrameset,
-        :trailingEnd
-    ]
+    @@phases = %w( initial rootElement beforeHead inHead afterHead inBody inTable inCaption
+      inColumnGroup inTableBody inRow inCell inSelect afterBody inFrameset afterFrameset trailingEnd )
 
     # :strict - raise an exception when a parse error is encountered
     # :tree - a treebuilder class controlling the type of tree that will be
     # returned. Built in treebuilders can be accessed through
     # html5lib.treebuilders.getTreeBuilder(treeType)
     def initialize(options = {})
-        @strict = false
-        @errors = []
-       
-        @tokenizer =  HTMLTokenizer
-        @tree = TreeBuilders::REXMLTree::TreeBuilder
+      @strict = false
+      @errors = []
+     
+      @tokenizer =  HTMLTokenizer
+      @tree = TreeBuilders::REXMLTree::TreeBuilder
  
-        options.each { |name, value| instance_variable_set("@#{name}", value) }
+      options.each { |name, value| instance_variable_set("@#{name}", value) }
 
-        @tree = @tree.new
+      @tree = @tree.new
 
-        @phases = @@phases.inject({}) do |phases, symbol|
-            class_name = symbol.to_s.sub(/(.)/) { $1.upcase } + 'Phase'
-            phases[symbol] = HTML5lib.const_get(class_name).new(self, @tree)
-            phases 
-        end
+      @phases = @@phases.inject({}) do |phases, phase_name|
+        phase_class_name = phase_name.sub(/(.)/) { $1.upcase } + 'Phase'
+        phases[phase_name.to_sym] = HTML5lib.const_get(phase_class_name).new(self, @tree)
+        phases 
+      end
     end
 
     def _parse(stream, innerHTML, encoding, container = 'div')
-        @tree.reset
-        @firstStartTag = false
-        @errors = []
+      @tree.reset
+      @firstStartTag = false
+      @errors = []
 
-        @tokenizer = @tokenizer.class unless Class === @tokenizer
-        @tokenizer = @tokenizer.new(stream, :encoding => encoding, :parseMeta => innerHTML)
+      @tokenizer = @tokenizer.class unless Class === @tokenizer
+      @tokenizer = @tokenizer.new(stream, :encoding => encoding, :parseMeta => innerHTML)
 
-        if innerHTML
-            case @innerHTML = container.downcase
-                when 'title', 'textarea'
-                    @tokenizer.contentModelFlag = :RCDATA
-                when 'style', 'script', 'xmp', 'iframe', 'noembed', 'noframes', 'noscript'
-                    @tokenizer.contentModelFlag = :CDATA
-                when 'plaintext'
-                    @tokenizer.contentModelFlag = :PLAINTEXT
-                else
-                # contentModelFlag already is PCDATA
-                #@tokenizer.contentModelFlag = :PCDATA
-            end
-            
-            @phase = @phases[:rootElement]
-            @phase.insertHtmlElement
-            resetInsertionMode
-        else
-            @innerHTML = false
-            @phase = @phases[:initial]
+      if innerHTML
+        case @innerHTML = container.downcase
+          when 'title', 'textarea'
+            @tokenizer.contentModelFlag = :RCDATA
+          when 'style', 'script', 'xmp', 'iframe', 'noembed', 'noframes', 'noscript'
+            @tokenizer.contentModelFlag = :CDATA
+          when 'plaintext'
+            @tokenizer.contentModelFlag = :PLAINTEXT
+          else
+          # contentModelFlag already is PCDATA
+          #@tokenizer.contentModelFlag = :PCDATA
         end
+      
+        @phase = @phases[:rootElement]
+        @phase.insertHtmlElement
+        resetInsertionMode
+      else
+        @innerHTML = false
+        @phase = @phases[:initial]
+      end
 
-        # We only seem to have InBodyPhase testcases where the following is
-        # relevant ... need others too
-        @lastPhase = nil
+      # We only seem to have InBodyPhase testcases where the following is
+      # relevant ... need others too
+      @lastPhase = nil
 
-        # XXX This is temporary for the moment so there isn't any other
-        # changes needed for the parser to work with the iterable tokenizer
-        @tokenizer.each do |token|
-            token = normalizeToken(token)
+      # XXX This is temporary for the moment so there isn't any other
+      # changes needed for the parser to work with the iterable tokenizer
+      @tokenizer.each do |token|
+        token = normalizeToken(token)
 
-            method = 'process%s' % token[:type]
+        method = 'process%s' % token[:type]
 
-            case token[:type]
-                when :Characters, :SpaceCharacters, :Comment
-                    @phase.send method, token[:data]
-                when :StartTag, :Doctype
-                    @phase.send method, token[:name], token[:data]
-                when :EndTag
-                    @phase.send method, token[:name]
-                else
-                    parseError(token[:data])
-            end
+        case token[:type]
+          when :Characters, :SpaceCharacters, :Comment
+            @phase.send method, token[:data]
+          when :StartTag, :Doctype
+            @phase.send method, token[:name], token[:data]
+          when :EndTag
+            @phase.send method, token[:name]
+          else
+            parseError(token[:data])
         end
+      end
 
-        # When the loop finishes it's EOF
-        @phase.processEOF
-     end
-
-     # Parse a HTML document into a well-formed tree
-     #
-     # stream - a filelike object or string containing the HTML to be parsed
-     #
-     # The optional encoding parameter must be a string that indicates
-     # the encoding.  If specified, that encoding will be used,
-     # regardless of any BOM or later declaration (such as in a meta
-     # element)
-    def parse(stream, encoding = nil)
-        _parse(stream, false, encoding)
-        return @tree.getDocument
+      # When the loop finishes it's EOF
+      @phase.processEOF
     end
-    
+
+    # Parse a HTML document into a well-formed tree
+    #
+    # stream - a filelike object or string containing the HTML to be parsed
+    #
+    # The optional encoding parameter must be a string that indicates
+    # the encoding.  If specified, that encoding will be used,
+    # regardless of any BOM or later declaration (such as in a meta
+    # element)
+    def parse(stream, encoding=nil)
+      _parse(stream, false, encoding)
+      return @tree.getDocument
+    end
+  
     # Parse a HTML fragment into a well-formed tree fragment
-        
+    
     # container - name of the element we're setting the innerHTML property
     # if set to nil, default to 'div'
     #
@@ -146,15 +136,15 @@ class HTMLParser
     # the encoding.  If specified, that encoding will be used,
     # regardless of any BOM or later declaration (such as in a meta
     # element)
-    def parseFragment(stream, container = 'div', encoding = nil)
-        _parse(stream, true, encoding, container)
-        return @tree.getFragment
+    def parseFragment(stream, container='div', encoding=nil)
+      _parse(stream, true, encoding, container)
+      return @tree.getFragment
     end
 
     def parseError(data = 'XXX ERROR MESSAGE NEEDED')
-        # XXX The idea is to make data mandatory.
-        @errors.push([@tokenizer.stream.position, data])
-        raise ParseError if @strict
+      # XXX The idea is to make data mandatory.
+      @errors.push([@tokenizer.stream.position, data])
+      raise ParseError if @strict
     end
 
     # This error is not an error
@@ -164,1857 +154,95 @@ class HTMLParser
     # HTML5 specific normalizations to the token stream
     def normalizeToken(token)
 
-        if token[:type] == :EmptyTag
-            # When a solidus (/) is encountered within a tag name what happens
-            # depends on whether the current tag name matches that of a void
-            # element.  If it matches a void element atheists did the wrong
-            # thing and if it doesn't it's wrong for everyone.
+      if token[:type] == :EmptyTag
+        # When a solidus (/) is encountered within a tag name what happens
+        # depends on whether the current tag name matches that of a void
+        # element.  If it matches a void element atheists did the wrong
+        # thing and if it doesn't it's wrong for everyone.
 
-            if VOID_ELEMENTS.include?(token[:name])
-                atheistParseError
-            else
-                parseError(_('Solidus (/) incorrectly placed in tag.'))
-            end
-
-            token[:type] = :StartTag
+        if VOID_ELEMENTS.include?(token[:name])
+          atheistParseError
+        else
+          parseError(_('Solidus (/) incorrectly placed in tag.'))
         end
 
-        if token[:type] == :StartTag
-            token[:name] = token[:name].tr(ASCII_UPPERCASE,ASCII_LOWERCASE)
+        token[:type] = :StartTag
+      end
 
-            # We need to remove the duplicate attributes and convert attributes
-            # to a dict so that [["x", "y"], ["x", "z"]] becomes {"x": "y"}
+      if token[:type] == :StartTag
+        token[:name] = token[:name].tr(ASCII_UPPERCASE,ASCII_LOWERCASE)
 
-            if token[:data].length
-                token[:data] = Hash[*token[:data].reverse.map {|attr,value|
-                  [attr.tr(ASCII_UPPERCASE,ASCII_LOWERCASE),value]
-                }.flatten]
-            else
-                token[:data] = {}
-            end
+        # We need to remove the duplicate attributes and convert attributes
+        # to a dict so that [["x", "y"], ["x", "z"]] becomes {"x": "y"}
 
-        elsif token[:type] == :EndTag
-            parseError(_('End tag contains unexpected attributes.')) if token[:data]
-            token[:name] = token[:name].downcase
+        unless token[:data].empty?
+          data = token[:data].reverse.map { |attr, value| [attr.tr(ASCII_UPPERCASE, ASCII_LOWERCASE), value] }
+          token[:data] = Hash[*data.flatten]
         end
 
-        return token
+      elsif token[:type] == :EndTag
+        parseError(_('End tag contains unexpected attributes.')) if token[:data]
+        token[:name] = token[:name].downcase
+      end
+
+      return token
     end
 
     @@new_modes = {
-        'select' => :inSelect,
-        'td' => :inCell,
-        'th' => :inCell,
-        'tr' => :inRow,
-        'tbody' => :inTableBody,
-        'thead' => :inTableBody,
-        'tfoot' => :inTableBody,
-        'caption' => :inCaption,
-        'colgroup' => :inColumnGroup,
-        'table' => :inTable,
-        'head' => :inBody,
-        'body' => :inBody,
-        'frameset' => :inFrameset
+      'select' => :inSelect,
+      'td' => :inCell,
+      'th' => :inCell,
+      'tr' => :inRow,
+      'tbody' => :inTableBody,
+      'thead' => :inTableBody,
+      'tfoot' => :inTableBody,
+      'caption' => :inCaption,
+      'colgroup' => :inColumnGroup,
+      'table' => :inTable,
+      'head' => :inBody,
+      'body' => :inBody,
+      'frameset' => :inFrameset
     }
 
     def resetInsertionMode
-        # The name of this method is mostly historical. (It's also used in the
-        # specification.)
-        last = false
+      # The name of this method is mostly historical. (It's also used in the
+      # specification.)
+      last = false
 
-        @tree.openElements.reverse.each do |node|
-            nodeName = node.name
+      @tree.openElements.reverse.each do |node|
+        nodeName = node.name
 
-            if node == @tree.openElements[0]
-                last = true
-                unless ['td', 'th'].include?(nodeName)
-                    # XXX
-                    # assert @innerHTML
-                    nodeName = @innerHTML
-                end
-            end
-
-            # Check for conditions that should only happen in the innerHTML
-            # case
-            if ['select', 'colgroup', 'head', 'frameset'].include?(nodeName)
-                # XXX
-                # assert @innerHTML
-            end
-
-            if @@new_modes.has_key?(nodeName)
-                @phase = @phases[@@new_modes[nodeName]]
-            elsif nodeName == 'html'
-                @phase = @phases[@tree.headPointer.nil?? :beforeHead : :afterHead]
-            elsif last
-                @phase = @phases[:inBody]
-            else
-                next
-            end
-
-            break
+        if node == @tree.openElements[0]
+          last = true
+          unless ['td', 'th'].include?(nodeName)
+            # XXX
+            # assert @innerHTML
+            nodeName = @innerHTML
+          end
         end
+
+        # Check for conditions that should only happen in the innerHTML
+        # case
+        if ['select', 'colgroup', 'head', 'frameset'].include?(nodeName)
+          # XXX
+          # assert @innerHTML
+        end
+
+        if @@new_modes.has_key?(nodeName)
+          @phase = @phases[@@new_modes[nodeName]]
+        elsif nodeName == 'html'
+          @phase = @phases[@tree.headPointer.nil?? :beforeHead : :afterHead]
+        elsif last
+          @phase = @phases[:inBody]
+        else
+          next
+        end
+
+        break
+      end
     end
 
     def _(string); string; end
-end
-
-# Base class for helper object that implements each phase of processing
-class Phase
-    # Order should be (they can be omitted)
-    # * EOF
-    # * Comment
-    # * Doctype
-    # * SpaceCharacters
-    # * Characters
-    # * StartTag
-    #   - startTag* methods
-    # * EndTag
-    #   - endTag* methods
-
-   def self.tag_handler_map(default,array)
-        array.inject(Hash.new(default)) do |map, (names, value)|
-            names = [names] unless Array === names
-            names.each { |name| map[name] = value }
-            map
-        end
-    end
-
-    def self.start_tag_handlers
-        @start_tag_handlers
-    end
-
-    def self.handle_start(tags)
-        @start_tag_handlers = tag_handler_map(:startTagOther, tags)
-    end
-
-    def self.end_tag_handlers
-        @end_tag_handlers
-    end
-
-    def self.handle_end(tags)
-        @end_tag_handlers = tag_handler_map(:endTagOther, tags)
-    end
-
-    def initialize(parser, tree)
-        @parser = parser
-        @tree = tree
-    end
-
-    def processEOF
-        @tree.generateImpliedEndTags
-
-        if @tree.openElements.length > 2
-            @parser.parseError(_('Unexpected end of file. Missing closing tags.'))
-        elsif @tree.openElements.length == 2 and @tree.openElements[1].name != 'body'
-            # This happens for framesets or something?
-            @parser.parseError(_("Unexpected end of file. Expected end tag (#{@tree.openElements[1].name}) first."))
-        elsif @parser.innerHTML and @tree.openElements.length > 1 
-            # XXX This is not what the specification says. Not sure what to do here.
-            @parser.parseError(_('XXX innerHTML EOF'))
-        end
-        # Betting ends.
-    end
-
-    def processComment(data)
-        # For most phases the following is correct. Where it's not it will be
-        # overridden.
-        @tree.insertComment(data, @tree.openElements[-1])
-    end
-
-    def processDoctype(name, error)
-        @parser.parseError(_('Unexpected DOCTYPE. Ignored.'))
-    end
-
-    def processSpaceCharacters(data)
-        @tree.insertText(data)
-    end
-
-    def processStartTag(name, attributes)
-        send self.class.start_tag_handlers[name], name, attributes
-    end
-
-    def startTagHtml(name, attributes)
-        if @parser.firstStartTag == false and name == 'html'
-           @parser.parseError(_('html needs to be the first start tag.'))
-        end
-        # XXX Need a check here to see if the first start tag token emitted is
-        # this token... If it's not, invoke @parser.parseError.
-        attributes.each do |attr, value|
-            unless @tree.openElements[0].attributes.has_key?(attr)
-                @tree.openElements[0].attributes[attr] = value
-            end
-        end
-        @parser.firstStartTag = false
-    end
-
-    def processEndTag(name)
-        send self.class.end_tag_handlers[name], name
-    end
-
-    def _(string)
-        string
-    end
-
-    def assert(value)
-        throw AssertionError.new unless value
-    end
-
-    def in_scope?(*args)
-        @tree.elementInScope(*args)
-    end
-
-    def remove_open_elements_until(name = nil)
-        finished = false
-        until finished
-            element = @tree.openElements.pop
-            finished = name.nil?? yield(element) : element.name == name
-        end
-        return element
-    end
-
-end
-
-
-class InitialPhase < Phase
-    # This phase deals with error handling as well which is currently not
-    # covered in the specification. The error handling is typically known as
-    # "quirks mode". It is expected that a future version of HTML5 will defin
-    # this.
-    def processEOF
-        @parser.parseError(_('Unexpected End of file. Expected DOCTYPE.'))
-        @parser.phase = @parser.phases[:rootElement]
-        @parser.phase.processEOF
-    end
-
-    def processComment(data)
-        @tree.insertComment(data, @tree.document)
-    end
-
-    def processDoctype(name, error)
-        @parser.parseError(_('Erroneous DOCTYPE.')) if error
-        @tree.insertDoctype(name)
-        @parser.phase = @parser.phases[:rootElement]
-    end
-
-    def processSpaceCharacters(data)
-        @tree.insertText(data, @tree.document)
-    end
-
-    def processCharacters(data)
-        @parser.parseError(_('Unexpected non-space characters. Expected DOCTYPE.'))
-        @parser.phase = @parser.phases[:rootElement]
-        @parser.phase.processCharacters(data)
-    end
-
-    def processStartTag(name, attributes)
-        @parser.parseError(_("Unexpected start tag (#{name}). Expected DOCTYPE."))
-        @parser.phase = @parser.phases[:rootElement]
-        @parser.phase.processStartTag(name, attributes)
-    end
-
-    def processEndTag(name)
-        @parser.parseError(_("Unexpected end tag (#{name}). Expected DOCTYPE."))
-        @parser.phase = @parser.phases[:rootElement]
-        @parser.phase.processEndTag(name)
-    end
-end
-
-
-class RootElementPhase < Phase
-    # helper methods
-    def insertHtmlElement
-        element = @tree.createElement('html', {})
-        @tree.openElements.push(element)
-        @tree.document.appendChild(element)
-        @parser.phase = @parser.phases[:beforeHead]
-    end
-
-    # other
-    def processEOF
-        insertHtmlElement
-        @parser.phase.processEOF
-    end
-
-    def processComment(data)
-        @tree.insertComment(data, @tree.document)
-    end
-
-    def processSpaceCharacters(data)
-        @tree.insertText(data, @tree.document)
-    end
-
-    def processCharacters(data)
-        insertHtmlElement
-        @parser.phase.processCharacters(data)
-    end
-
-    def processStartTag(name, attributes)
-        @parser.firstStartTag = true if name == 'html'
-        insertHtmlElement
-        @parser.phase.processStartTag(name, attributes)
-    end
-
-    def processEndTag(name)
-        insertHtmlElement
-        @parser.phase.processEndTag(name)
-    end
-end
-
-
-class BeforeHeadPhase < Phase
-
-    handle_start [
-        ['html', :startTagHtml],
-        ['head', :startTagHead]
-    ]
-
-    handle_end [
-        ['html', :endTagHtml]
-    ]
-
-    def processEOF
-        startTagHead('head', {})
-        @parser.phase.processEOF
-    end
-
-    def processCharacters(data)
-        startTagHead('head', {})
-        @parser.phase.processCharacters(data)
-    end
-
-    def startTagHead(name, attributes)
-        @tree.insertElement(name, attributes)
-        @tree.headPointer = @tree.openElements[-1]
-        @parser.phase = @parser.phases[:inHead]
-    end
-
-    def startTagOther(name, attributes)
-        startTagHead('head', {})
-        @parser.phase.processStartTag(name, attributes)
-    end
-
-    def endTagHtml(name)
-        startTagHead('head', {})
-        @parser.phase.processEndTag(name)
-    end
-
-    def endTagOther(name)
-        @parser.parseError(_("Unexpected end tag (#{name}) after the (implied) root element."))
-    end
-end
-
-class InHeadPhase < Phase
-
-    handle_start [
-        ['html', :startTagHtml],
-        ['title', :startTagTitle],
-        ['style', :startTagStyle],
-        ['script', :startTagScript],
-        [['base', 'link', 'meta'], :startTagBaseLinkMeta],
-        ['head', :startTagHead]
-    ]
-
-    handle_end [
-        ['head', :endTagHead],
-        ['html', :endTagHtml],
-        [['title', 'style', 'script'], :endTagTitleStyleScript]
-    ]
-
-    # helper
-    def appendToHead(element)
-        if @tree.headPointer.nil?
-            assert @parser.innerHTML
-            @tree.openElements[-1].appendChild(element)
-        else
-            @tree.headPointer.appendChild(element)
-        end
-    end
-
-    # the real thing
-    def processEOF
-        if ['title', 'style', 'script'].include?(name = @tree.openElements[-1].name)
-            @parser.parseError(_("Unexpected end of file. Expected end tag (#{name})."))
-            @tree.openElements.pop
-        end
-        anythingElse
-        @parser.phase.processEOF
-    end
-
-    def processCharacters(data)
-        if ['title', 'style', 'script'].include?(@tree.openElements[-1].name)
-            @tree.insertText(data)
-        else
-            anythingElse
-            @parser.phase.processCharacters(data)
-        end
-    end
-
-    def startTagHead(name, attributes)
-        @parser.parseError(_('Unexpected start tag head in existing head. Ignored'))
-    end
-
-    def startTagTitle(name, attributes)
-        element = @tree.createElement(name, attributes)
-        appendToHead(element)
-        @tree.openElements.push(element)
-        @parser.tokenizer.contentModelFlag = :RCDATA
-    end
-
-    def startTagStyle(name, attributes)
-        element = @tree.createElement(name, attributes)
-        if @tree.headPointer != nil and @parser.phase == @parser.phases[:inHead]
-            appendToHead(element)
-        else
-            @tree.openElements[-1].appendChild(element)
-        end
-        @tree.openElements.push(element)
-        @parser.tokenizer.contentModelFlag = :CDATA
-    end
-
-    def startTagScript(name, attributes)
-        #XXX Inner HTML case may be wrong
-        element = @tree.createElement(name, attributes)
-        element._flags.push("parser-inserted")
-        if (@tree.headPointer != nil and
-            @parser.phase == @parser.phases[:inHead])
-            appendToHead(element)
-        else
-            @tree.openElements[-1].appendChild(element)
-        end
-        @tree.openElements.push(element)
-        @parser.tokenizer.contentModelFlag = :CDATA
-    end
-
-    def startTagBaseLinkMeta(name, attributes)
-        element = @tree.createElement(name, attributes)
-        appendToHead(element)
-    end
-
-    def startTagOther(name, attributes)
-        anythingElse
-        @parser.phase.processStartTag(name, attributes)
-    end
-
-    def endTagHead(name)
-        if @tree.openElements[-1].name == 'head'
-            @tree.openElements.pop
-        else
-            @parser.parseError(_("Unexpected end tag (head). Ignored."))
-        end
-        @parser.phase = @parser.phases[:afterHead]
-    end
-
-    def endTagHtml(name)
-        anythingElse
-        @parser.phase.processEndTag(name)
-    end
-
-    def endTagTitleStyleScript(name)
-        if @tree.openElements[-1].name == name
-            @tree.openElements.pop
-        else
-            @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
-        end
-    end
-
-    def endTagOther(name)
-        @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
-    end
-
-    def anythingElse
-        if @tree.openElements[-1].name == 'head'
-            endTagHead('head')
-        else
-            @parser.phase = @parser.phases[:afterHead]
-        end
-    end
-end
-
-class AfterHeadPhase < Phase
-    
-    handle_start [
-        ['html', :startTagHtml],
-        ['body', :startTagBody],
-        ['frameset', :startTagFrameset],
-        [['base', 'link', 'meta', 'script', 'style', 'title'], :startTagFromHead]
-    ]
-
-    def processEOF
-        anythingElse
-        @parser.phase.processEOF
-    end
-
-    def processCharacters(data)
-        anythingElse
-        @parser.phase.processCharacters(data)
-    end
-
-    def startTagBody(name, attributes)
-        @tree.insertElement(name, attributes)
-        @parser.phase = @parser.phases[:inBody]
-    end
-
-    def startTagFrameset(name, attributes)
-        @tree.insertElement(name, attributes)
-        @parser.phase = @parser.phases[:inFrameset]
-    end
-
-    def startTagFromHead(name, attributes)
-        @parser.parseError(_("Unexpected start tag (#{name}) that can be in head. Moved."))
-        @parser.phase = @parser.phases[:inHead]
-        @parser.phase.processStartTag(name, attributes)
-    end
-
-    def startTagOther(name, attributes)
-        anythingElse
-        @parser.phase.processStartTag(name, attributes)
-    end
-
-    def processEndTag(name)
-        anythingElse
-        @parser.phase.processEndTag(name)
-    end
-
-    def anythingElse
-        @tree.insertElement('body', {})
-        @parser.phase = @parser.phases[:inBody]
-    end
-end
-
-
-class InBodyPhase < Phase
-    # http://www.whatwg.org/specs/web-apps/current-work/#in-body
-    # the crazy mode
-
-    handle_start [
-        ['html', :startTagHtml],
-        [['script', 'style'], :startTagScriptStyle],
-        [['base', 'link', 'meta', 'title'], :startTagFromHead],
-        ['body', :startTagBody],
-        [['address', 'blockquote', 'center', 'dir', 'div', 'dl',
-          'fieldset', 'listing', 'menu', 'ol', 'p', 'pre', 'ul'],
-          :startTagCloseP],
-        ['form', :startTagForm],
-        [['li', 'dd', 'dt'], :startTagListItem],
-        ['plaintext',:startTagPlaintext],
-        [HEADING_ELEMENTS, :startTagHeading],
-        ['a', :startTagA],
-        [['b', 'big', 'em', 'font', 'i', 'nobr', 's', 'small', 'strike',
-          'strong', 'tt', 'u'],:startTagFormatting],
-        ['button', :startTagButton],
-        [['marquee', 'object'], :startTagMarqueeObject],
-        ['xmp', :startTagXmp],
-        ['table', :startTagTable],
-        [['area', 'basefont', 'bgsound', 'br', 'embed', 'img', 'param',
-          'spacer', 'wbr'], :startTagVoidFormatting],
-        ['hr', :startTagHr],
-        ['image', :startTagImage],
-        ['input', :startTagInput],
-        ['isindex', :startTagIsIndex],
-        ['textarea', :startTagTextarea],
-        [['iframe', 'noembed', 'noframes', 'noscript'], :startTagCdata],
-        ['select', :startTagSelect],
-        [['caption', 'col', 'colgroup', 'frame', 'frameset', 'head',
-          'option', 'optgroup', 'tbody', 'td', 'tfoot', 'th', 'thead',
-          'tr'], :startTagMisplaced],
-        [['event-source', 'section', 'nav', 'article', 'aside', 'header',
-          'footer', 'datagrid', 'command'], :startTagNew]
-    ]
-
-    handle_end [
-        ['p',:endTagP],
-        ['body',:endTagBody],
-        ['html',:endTagHtml],
-        [['address', 'blockquote', 'center', 'div', 'dl', 'fieldset',
-          'listing', 'menu', 'ol', 'pre', 'ul'], :endTagBlock],
-        ['form', :endTagForm],
-        [['dd', 'dt', 'li'], :endTagListItem],
-        [HEADING_ELEMENTS, :endTagHeading],
-        [['a', 'b', 'big', 'em', 'font', 'i', 'nobr', 's', 'small',
-          'strike', 'strong', 'tt', 'u'], :endTagFormatting],
-        [['marquee', 'object', 'button'], :endTagButtonMarqueeObject],
-        [['head', 'frameset', 'select', 'optgroup', 'option', 'table',
-          'caption', 'colgroup', 'col', 'thead', 'tfoot', 'tbody', 'tr',
-          'td', 'th'], :endTagMisplaced],
-        [['area', 'basefont', 'bgsound', 'br', 'embed', 'hr', 'image',
-          'img', 'input', 'isindex', 'param', 'spacer', 'wbr', 'frame'],
-          :endTagNone],
-        [['noframes', 'noscript', 'noembed', 'textarea', 'xmp', 'iframe'],
-          :endTagCdataTextAreaXmp],
-        [['event-source', 'section', 'nav', 'article', 'aside', 'header',
-          'footer', 'datagrid', 'command'], :endTagNew]
-    ]
-
-    def initialize(parser, tree)
-        super(parser, tree)
-
-        # for special handling of whitespace in <pre>
-        @processSpaceCharactersPre = false
-    end
-
-    # helper
-    def addFormattingElement(name, attributes)
-        @tree.insertElement(name, attributes)
-        @tree.activeFormattingElements.push(@tree.openElements[-1])
-    end
-
-    # the real deal
-    def processSpaceCharactersPre(data)
-        #Sometimes (start of <pre> blocks) we want to drop leading newlines
-        @processSpaceCharactersPre = false
-        if (data.length > 0 and data[0] == ?\n and 
-            @tree.openElements[-1].name == 'pre' and
-            not @tree.openElements[-1].hasContent)
-            data = data[1..-1]
-        end
-        @tree.insertText(data) if data.length > 0
-    end
-
-    def processSpaceCharacters(data)
-        if @processSpaceCharactersPre
-            processSpaceCharactersPre(data)
-        else
-            super(data)
-        end
-    end
-
-    def processCharacters(data)
-        # XXX The specification says to do this for every character at the
-        # moment, but apparently that doesn't match the real world so we don't
-        # do it for space characters.
-        @tree.reconstructActiveFormattingElements
-        @tree.insertText(data)
-    end
-
-    def startTagScriptStyle(name, attributes)
-        @parser.phases[:inHead].processStartTag(name, attributes)
-    end
-
-    def startTagFromHead(name, attributes)
-        @parser.parseError(_("Unexpected start tag (#{name}) that belongs in the head. Moved."))
-        @parser.phases[:inHead].processStartTag(name, attributes)
-    end
-
-    def startTagBody(name, attributes)
-        @parser.parseError(_('Unexpected start tag (body).'))
-
-        if (@tree.openElements.length == 1 or
-            @tree.openElements[1].name != 'body')
-            assert @parser.innerHTML
-        else
-            attributes.each do |attr, value|
-                unless @tree.openElements[1].attributes.has_key?(attr)
-                    @tree.openElements[1].attributes[attr] = value
-                end
-            end
-        end
-    end
-
-    def startTagCloseP(name, attributes)
-        endTagP('p') if in_scope?('p')
-        @tree.insertElement(name, attributes)
-        @processSpaceCharactersPre = true if name == 'pre'
-    end
-
-    def startTagForm(name, attributes)
-        if @tree.formPointer
-            @parser.parseError('Unexpected start tag (form). Ignored.')
-        else
-            endTagP('p') if in_scope?('p')
-            @tree.insertElement(name, attributes)
-            @tree.formPointer = @tree.openElements[-1]
-        end
-    end
-
-    def startTagListItem(name, attributes)
-        endTagP('p') if in_scope?('p')
-        stopNames = {'li' => ['li'], 'dd' => ['dd', 'dt'], 'dt' => ['dd', 'dt']}
-        stopName = stopNames[name]
-
-        @tree.openElements.reverse.each_with_index do |node,i|
-            if stopName.include?(node.name)
-                (i+1).times { @tree.openElements.pop }
-                break
-            end
-
-            # Phrasing elements are all non special, non scoping, non
-            # formatting elements
-            break if ((SPECIAL_ELEMENTS + SCOPING_ELEMENTS).include?(node.name) and
-              not ['address', 'div'].include?(node.name))
-        end
-
-        # Always insert an <li> element.
-        @tree.insertElement(name, attributes)
-    end
-
-    def startTagPlaintext(name, attributes)
-        endTagP('p') if in_scope?('p')
-        @tree.insertElement(name, attributes)
-        @parser.tokenizer.contentModelFlag = :PLAINTEXT
-    end
-
-    def startTagHeading(name, attributes)
-        endTagP('p') if in_scope?('p')
-        HEADING_ELEMENTS.each do |element|
-            if in_scope?(element)
-                @parser.parseError(_("Unexpected start tag (#{name})."))
-                
-                remove_open_elements_until { |element| HEADING_ELEMENTS.include?(element.name) }
-
-                break
-             end
-        end
-        @tree.insertElement(name, attributes)
-    end
-
-    def startTagA(name, attributes)
-        if afeAElement = @tree.elementInActiveFormattingElements('a')
-            @parser.parseError(_('Unexpected start tag (a) implies end tag (a).'))
-            endTagFormatting('a')
-            @tree.openElements.delete(afeAElement) if @tree.openElements.include?(afeAElement)
-            @tree.activeFormattingElements.delete(afeAElement) if @tree.activeFormattingElements.include?(afeAElement)
-        end
-        @tree.reconstructActiveFormattingElements
-        addFormattingElement(name, attributes)
-    end
-
-    def startTagFormatting(name, attributes)
-        @tree.reconstructActiveFormattingElements
-        addFormattingElement(name, attributes)
-    end
-
-    def startTagButton(name, attributes)
-        if in_scope?('button')
-            @parser.parseError(_('Unexpected start tag (button) implied end tag (button).'))
-            processEndTag('button')
-            @parser.phase.processStartTag(name, attributes)
-        else
-            @tree.reconstructActiveFormattingElements
-            @tree.insertElement(name, attributes)
-            @tree.activeFormattingElements.push(Marker)
-        end
-    end
-
-    def startTagMarqueeObject(name, attributes)
-        @tree.reconstructActiveFormattingElements
-        @tree.insertElement(name, attributes)
-        @tree.activeFormattingElements.push(Marker)
-    end
-
-    def startTagXmp(name, attributes)
-        @tree.reconstructActiveFormattingElements
-        @tree.insertElement(name, attributes)
-        @parser.tokenizer.contentModelFlag = :CDATA
-    end
-
-    def startTagTable(name, attributes)
-        processEndTag('p') if in_scope?('p')
-        @tree.insertElement(name, attributes)
-        @parser.phase = @parser.phases[:inTable]
-    end
-
-    def startTagVoidFormatting(name, attributes)
-        @tree.reconstructActiveFormattingElements
-        @tree.insertElement(name, attributes)
-        @tree.openElements.pop
-    end
-
-    def startTagHr(name, attributes)
-        endTagP('p') if in_scope?('p')
-        @tree.insertElement(name, attributes)
-        @tree.openElements.pop
-    end
-
-    def startTagImage(name, attributes)
-        # No really...
-        @parser.parseError(_('Unexpected start tag (image). Treated as img.'))
-        processStartTag('img', attributes)
-    end
-
-    def startTagInput(name, attributes)
-        @tree.reconstructActiveFormattingElements
-        @tree.insertElement(name, attributes)
-        if @tree.formPointer
-            # XXX Not exactly sure what to do here
-            # @tree.openElements[-1].form = @tree.formPointer
-        end
-        @tree.openElements.pop
-    end
-
-    def startTagIsIndex(name, attributes)
-        @parser.parseError("Unexpected start tag isindex. Don't use it!")
-        return if @tree.formPointer
-        processStartTag('form', {})
-        processStartTag('hr', {})
-        processStartTag('p', {})
-        processStartTag('label', {})
-        # XXX Localization ...
-        processCharacters('This is a searchable index. Insert your search keywords here:')
-        attributes['name'] = 'isindex'
-        attrs = attributes.to_a
-        processStartTag('input', attributes)
-        processEndTag('label')
-        processEndTag('p')
-        processStartTag('hr', {})
-        processEndTag('form')
-    end
-
-    def startTagTextarea(name, attributes)
-        # XXX Form element pointer checking here as well...
-        @tree.insertElement(name, attributes)
-        @parser.tokenizer.contentModelFlag = :RCDATA
-    end
-
-    # iframe, noembed noframes, noscript(if scripting enabled)
-    def startTagCdata(name, attributes)
-        @tree.insertElement(name, attributes)
-        @parser.tokenizer.contentModelFlag = :CDATA
-    end
-
-    def startTagSelect(name, attributes)
-        @tree.reconstructActiveFormattingElements
-        @tree.insertElement(name, attributes)
-        @parser.phase = @parser.phases[:inSelect]
-    end
-
-    def startTagMisplaced(name, attributes)
-        # Elements that should be children of other elements that have a
-        # different insertion mode; here they are ignored
-        # "caption", "col", "colgroup", "frame", "frameset", "head",
-        # "option", "optgroup", "tbody", "td", "tfoot", "th", "thead",
-        # "tr", "noscript"
-        @parser.parseError(_("Unexpected start tag (#{name}). Ignored."))
-    end
-
-    def startTagNew(name, attributes)
-        # New HTML5 elements, "event-source", "section", "nav",
-        # "article", "aside", "header", "footer", "datagrid", "command"
-        sys.stderr.write("Warning: Undefined behaviour for start tag #{name}")
-        startTagOther(name, attributes)
-        #raise NotImplementedError
-    end
-
-    def startTagOther(name, attributes)
-        @tree.reconstructActiveFormattingElements
-        @tree.insertElement(name, attributes)
-    end
-
-    def endTagP(name)
-        @tree.generateImpliedEndTags('p') if in_scope?('p')
-        @parser.parseError('Unexpected end tag (p).') unless @tree.openElements[-1].name == 'p'
-        @tree.openElements.pop while in_scope?('p')
-    end
-
-    def endTagBody(name)
-        # XXX Need to take open <p> tags into account here. We shouldn't imply
-        # </p> but we should not throw a parse error either. Specification is
-        # likely to be updated.
-        unless @tree.openElements[1].name == 'body'
-            # innerHTML case
-            @parser.parseError
-            return
-        end
-        unless @tree.openElements[-1].name == 'body'
-            @parser.parseError(_("Unexpected end tag (body). Missing end tag (#{@tree.openElements[-1].name})."))
-        end
-        @parser.phase = @parser.phases[:afterBody]
-    end
-
-    def endTagHtml(name)
-        endTagBody(name)
-        @parser.phase.processEndTag(name) unless @parser.innerHTML
-    end
-
-    def endTagBlock(name)
-        #Put us back in the right whitespace handling mode
-        @processSpaceCharactersPre = false if name == 'pre'
-
-        @tree.generateImpliedEndTags if in_scope?(name)
-
-        unless @tree.openElements[-1].name == name
-            @parser.parseError(("End tag (#{name}) seen too early. Expected other end tag."))
-        end
-
-        if in_scope?(name)
-            remove_open_elements_until(name)
-        end
-    end
-
-    def endTagForm(name)
-        endTagBlock(name)
-        @tree.formPointer = nil
-    end
-
-    def endTagListItem(name)
-        # AT Could merge this with the Block case
-        if in_scope?(name)
-            @tree.generateImpliedEndTags(name)
-
-            unless @tree.openElements[-1].name == name
-                @parser.parseError(("End tag (#{name}) seen too early. Expected other end tag."))
-            end
-        end
-
-        remove_open_elements_until(name) if in_scope?(name)
-    end    
-
-    def endTagHeading(name)
-        HEADING_ELEMENTS.each do |element|
-            if in_scope?(element)
-                @tree.generateImpliedEndTags
-                break
-            end
-        end
-
-        unless @tree.openElements[-1].name == name
-            @parser.parseError(("Unexpected end tag (#{name}). Expected other end tag."))
-        end
-
-        HEADING_ELEMENTS.each do |element|
-            if in_scope?(element)
-                remove_open_elements_until { |element| HEADING_ELEMENTS.include?(element.name) }
-                break
-            end
-        end
-    end
-
-    # The much-feared adoption agency algorithm
-    #
-    # Handles the end tag of a formatting element. The outer loop repeats
-    # the whole procedure until one of the `return` statements in step 1 or
-    # step 3 is reached.
-    #
-    # name:: tag name of the formatting element being closed
-    def endTagFormatting(name)
-        # http://www.whatwg.org/specs/web-apps/current-work/#adoptionAgency
-        # XXX Better parseError messages appreciated.
-        while true
-            # Step 1 paragraph 1
-            # Bail out when there is no matching active formatting element,
-            # or it is open but not in scope.
-            afeElement = @tree.elementInActiveFormattingElements(name)
-            if not afeElement or (@tree.openElements.include?(afeElement) and not in_scope?(afeElement.name))
-                @parser.parseError(_("End tag (#{name}) violates step 1, paragraph 1 of the adoption agency algorithm."))
-                return
-            # Step 1 paragraph 2
-            # The element is no longer open: just forget it.
-            elsif not @tree.openElements.include?(afeElement)
-                @parser.parseError(_("End tag (#{name}) violates step 1, paragraph 2 of the adoption agency algorithm."))
-                @tree.activeFormattingElements.delete(afeElement)
-                return
-            end
-
-            # Step 1 paragraph 3
-            # Only reported; processing continues.
-            if afeElement != @tree.openElements[-1]
-                @parser.parseError(_("End tag (#{name}) violates step 1, paragraph 3 of the adoption agency algorithm."))
-            end
-
-            # Step 2
-            # Start of the adoption agency algorithm proper
-            # The furthest block is the first special or scoping element
-            # found at or after the formatting element in the open stack.
-            afeIndex = @tree.openElements.index(afeElement)
-            furthestBlock = nil
-            @tree.openElements[afeIndex..-1].each do |element|
-                if (SPECIAL_ELEMENTS + SCOPING_ELEMENTS).include?(element.name)
-                    furthestBlock = element
-                    break
-                end
-            end
-
-            # Step 3
-            # No furthest block: remove open elements up to the formatting
-            # element, drop it from the active list, and finish.
-            if furthestBlock.nil?
-                element = remove_open_elements_until { |element| element == afeElement }
-                @tree.activeFormattingElements.delete(element)
-                return
-            end
-            # The element immediately before the formatting element in the
-            # open stack.
-            commonAncestor = @tree.openElements[afeIndex-1]
-
-            # Step 5
-            furthestBlock.parent.removeChild(furthestBlock) if furthestBlock.parent
-
-            # Step 6
-            # The bookmark is supposed to help us identify where to reinsert
-            # nodes in step 12. We have to ensure that we reinsert nodes after
-            # the node before the active formatting element. Note the bookmark
-            # can move in step 7.4
-            bookmark = @tree.activeFormattingElements.index(afeElement)
-
-            # Step 7
-            lastNode = node = furthestBlock
-            while true
-                # AT replace this with a function and recursion?
-                # Node is element before node in open elements
-                node = @tree.openElements[@tree.openElements.index(node)-1]
-                # Skip (and remove from the open stack) every element that
-                # is not an active formatting element.
-                until @tree.activeFormattingElements.include?(node)
-                    tmpNode = node
-                    node = @tree.openElements[@tree.openElements.index(node)-1]
-                    @tree.openElements.delete(tmpNode)
-                end
-                # Step 7.3
-                break if node == afeElement
-                # Step 7.4
-                if lastNode == furthestBlock
-                    # XXX should this be index(node) or index(node)+1
-                    # Anne: I think +1 is ok. Given x = [2,3,4,5]
-                    # x.index(3) gives 1 and then x[1 +1] gives 4...
-                    bookmark = @tree.activeFormattingElements.index(node) + 1
-                end
-                # Step 7.5
-                # NOTE(review): `cite` is assigned but never read in this
-                # method.
-                cite = node.parent
-                if node.hasContent
-                    clone = node.cloneNode
-                    # Replace node with clone
-                    @tree.activeFormattingElements[@tree.activeFormattingElements.index(node)] = clone
-                    @tree.openElements[@tree.openElements.index(node)] = clone
-                    node = clone
-                end
-                # Step 7.6
-                # Remove lastNode from its parents, if any
-                lastNode.parent.removeChild(lastNode) if lastNode.parent
-                node.appendChild(lastNode)
-                # Step 7.7
-                lastNode = node
-                # End of inner loop
-            end
-
-            # Step 8
-            lastNode.parent.removeChild(lastNode) if lastNode.parent
-            commonAncestor.appendChild(lastNode)
-
-            # Step 9
-            clone = afeElement.cloneNode
-
-            # Step 10
-            furthestBlock.reparentChildren(clone)
-
-            # Step 11
-            furthestBlock.appendChild(clone)
-
-            # Step 12
-            # The insertion index is clamped to the list length because the
-            # delete above may have shortened the list.
-            @tree.activeFormattingElements.delete(afeElement)
-            @tree.activeFormattingElements.insert([bookmark,@tree.activeFormattingElements.length].min, clone)
-
-            # Step 13
-            @tree.openElements.delete(afeElement)
-            @tree.openElements.insert(@tree.openElements.index(furthestBlock) + 1, clone)
-        end
-    end
-
-    def endTagButtonMarqueeObject(name)
-        @tree.generateImpliedEndTags if in_scope?(name)
-
-        unless @tree.openElements[-1].name == name
-            @parser.parseError(_("Unexpected end tag (#{name}). Expected other end tag first."))
-        end
-
-        if in_scope?(name)
-            remove_open_elements_until(name)
-            
-            @tree.clearActiveFormattingElements
-        end
-    end
-
-    def endTagMisplaced(name)
-        # This handles elements with end tags in other insertion modes.
-        @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
-    end
-
-    def endTagNone(name)
-        # This handles elements with no end tag.
-        @parser.parseError(_("This tag (#{name}) has no end tag"))
-    end
-
-    def endTagCdataTextAreaXmp(name)
-        if @tree.openElements[-1].name == name
-            @tree.openElements.pop
-        else
-            @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
-        end
-    end
-
-    def endTagNew(name)
-        # New HTML5 elements, "event-source", "section", "nav",
-        # "article", "aside", "header", "footer", "datagrid", "command"
-        STDERR.puts "Warning: Undefined behaviour for end tag #{name}"
-        endTagOther(name)
-        #raise NotImplementedError
-    end
-
-    def endTagOther(name)
-        # XXX This logic should be moved into the treebuilder
-        @tree.openElements.reverse.each do |node|
-            if node.name == name
-                @tree.generateImpliedEndTags
-
-                unless @tree.openElements[-1].name == name
-                    @parser.parseError(_("Unexpected end tag (#{name})."))
-                end
-
-                remove_open_elements_until { |element| element == node }
-
-                break
-            else
-                if (SPECIAL_ELEMENTS + SCOPING_ELEMENTS).include?(node.name)
-                    @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
-                    break
-                end
-            end
-        end
-    end
-end
-
-class InTablePhase < Phase
-    # http://www.whatwg.org/specs/web-apps/current-work/#in-table
-
-    handle_start [
-        ['html', :startTagHtml],
-        ['caption', :startTagCaption],
-        ['colgroup', :startTagColgroup],
-        ['col', :startTagCol],
-        [['tbody', 'tfoot', 'thead'], :startTagRowGroup],
-        [['td', 'th', 'tr'], :startTagImplyTbody],
-        ['table', :startTagTable]
-    ]
-
-    handle_end [
-        ['table', :endTagTable],
-        [['body', 'caption', 'col', 'colgroup', 'html', 'tbody', 'td', 'tfoot', 'th', 'thead', 'tr'], :endTagIgnore]
-    ]
-
-    # helper methods
-    def clearStackToTableContext
-        # "clear the stack back to a table context"
-        until ['table', 'html'].include?(name = @tree.openElements[-1].name)
-            @parser.parseError(_("Unexpected implied end tag (#{name}) in the table phase."))
-            @tree.openElements.pop
-        end
-        # When the current node is <html> it's an innerHTML case
-    end
-
-    # processing methods
-    def processCharacters(data)
-        @parser.parseError(_("Unexpected non-space characters in table context caused voodoo mode."))
-        # Make all the special element rearranging voodoo kick in
-        @tree.insertFromTable = true
-        # Process the character in the "in body" mode
-        @parser.phases[:inBody].processCharacters(data)
-        @tree.insertFromTable = false
-    end
-
-    def startTagCaption(name, attributes)
-        clearStackToTableContext
-        @tree.activeFormattingElements.push(Marker)
-        @tree.insertElement(name, attributes)
-        @parser.phase = @parser.phases[:inCaption]
-    end
-
-    def startTagColgroup(name, attributes)
-        clearStackToTableContext
-        @tree.insertElement(name, attributes)
-        @parser.phase = @parser.phases[:inColumnGroup]
-    end
-
-    def startTagCol(name, attributes)
-        startTagColgroup('colgroup', {})
-        @parser.phase.processStartTag(name, attributes)
-    end
-
-    def startTagRowGroup(name, attributes)
-        clearStackToTableContext
-        @tree.insertElement(name, attributes)
-        @parser.phase = @parser.phases[:inTableBody]
-    end
-
-    def startTagImplyTbody(name, attributes)
-        startTagRowGroup('tbody', {})
-        @parser.phase.processStartTag(name, attributes)
-    end
-
-    def startTagTable(name, attributes)
-        @parser.parseError(_("Unexpected start tag (table) in table phase. Implies end tag (table)."))
-        @parser.phase.processEndTag('table')
-        @parser.phase.processStartTag(name, attributes) unless @parser.innerHTML
-    end
-
-    def startTagOther(name, attributes)
-        @parser.parseError(_("Unexpected start tag (#{name}) in table context caused voodoo mode."))
-        # Make all the special element rearranging voodoo kick in
-        @tree.insertFromTable = true
-        # Process the start tag in the "in body" mode
-        @parser.phases[:inBody].processStartTag(name, attributes)
-        @tree.insertFromTable = false
-    end
-
-    def endTagTable(name)
-        if in_scope?('table', true)
-            @tree.generateImpliedEndTags
-            
-            unless @tree.openElements[-1].name == 'table'
-                @parser.parseError(_("Unexpected end tag (table). Expected end tag (#{@tree.openElements[-1].name})."))
-            end
-            
-            remove_open_elements_until('table')
-
-            @parser.resetInsertionMode
-        else
-            # innerHTML case
-            assert @parser.innerHTML
-            @parser.parseError
-        end
-    end
-
-    def endTagIgnore(name)
-        @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
-    end
-
-    def endTagOther(name)
-        @parser.parseError(_("Unexpected end tag (#{name}) in table context caused voodoo mode."))
-        # Make all the special element rearranging voodoo kick in
-        @parser.insertFromTable = true
-        # Process the end tag in the "in body" mode
-        @parser.phases[:inBody].processEndTag(name)
-        @parser.insertFromTable = false
-    end
-end
-
-
-class InCaptionPhase < Phase
-    # http://www.whatwg.org/specs/web-apps/current-work/#in-caption
-
-    handle_start [
-        ['html', :startTagHtml],
-        [['caption', 'col', 'colgroup', 'tbody', 'td', 'tfoot', 'th', 'thead', 'tr'], :startTagTableElement]
-    ]
-
-    handle_end [
-        ['caption', :endTagCaption],
-        ['table', :endTagTable],
-        [['body', 'col', 'colgroup', 'html', 'tbody', 'td', 'tfoot', 'th', 'thead', 'tr'], :endTagIgnore]
-    ]
-
-    def ignoreEndTagCaption
-        not in_scope?('caption', true)
-    end
-
-    def processCharacters(data)
-        @parser.phases[:inBody].processCharacters(data)
-    end
-
-    def startTagTableElement(name, attributes)
-        @parser.parseError
-        #XXX Have to duplicate logic here to find out if the tag is ignored
-        ignoreEndTag = ignoreEndTagCaption
-        @parser.phase.processEndTag('caption')
-        @parser.phase.processStartTag(name, attributes) unless ignoreEndTag
-    end
-
-    def startTagOther(name, attributes)
-        @parser.phases[:inBody].processStartTag(name, attributes)
-    end
-
-    def endTagCaption(name)
-        if ignoreEndTagCaption
-            # innerHTML case
-            assert @parser.innerHTML
-            @parser.parseError
-        else
-            # AT this code is quite similar to endTagTable in "InTable"
-            @tree.generateImpliedEndTags
-
-            unless @tree.openElements[-1].name == 'caption'
-                @parser.parseError(_("Unexpected end tag (caption). Missing end tags."))
-            end
-
-            remove_open_elements_until('caption')
-
-            @tree.clearActiveFormattingElements
-            @parser.phase = @parser.phases[:inTable]
-        end
-    end
-
-    def endTagTable(name)
-        @parser.parseError
-        ignoreEndTag = ignoreEndTagCaption
-        @parser.phase.processEndTag('caption')
-        @parser.phase.processEndTag(name) unless ignoreEndTag
-    end
-
-    def endTagIgnore(name)
-        @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
-    end
-
-    def endTagOther(name)
-        @parser.phases[:inBody].processEndTag(name)
-    end
-end
-
-
-class InColumnGroupPhase < Phase
-    # http://www.whatwg.org/specs/web-apps/current-work/#in-column
-
-    handle_start [
-        ['html', :startTagHtml],
-        ['col', :startTagCol]
-    ]
-
-    handle_end [
-        ['colgroup', :endTagColgroup],
-        ['col', :endTagCol]
-    ]
-
-    def ignoreEndTagColgroup
-        @tree.openElements[-1].name == 'html'
-    end
-
-    def processCharacters(data)
-        ignoreEndTag = ignoreEndTagColgroup
-        endTagColgroup("colgroup")
-        @parser.phase.processCharacters(data) unless ignoreEndTag
-    end
-
-    def startTagCol(name, attributes)
-        @tree.insertElement(name, attributes)
-        @tree.openElements.pop
-    end
-
-    def startTagOther(name, attributes)
-        ignoreEndTag = ignoreEndTagColgroup
-        endTagColgroup('colgroup')
-        @parser.phase.processStartTag(name, attributes) unless ignoreEndTag
-    end
-
-    def endTagColgroup(name)
-        if ignoreEndTagColgroup
-            # innerHTML case
-            assert @parser.innerHTML
-            @parser.parseError
-        else
-            @tree.openElements.pop
-            @parser.phase = @parser.phases[:inTable]
-        end
-    end
-
-    def endTagCol(name)
-        @parser.parseError(_('Unexpected end tag (col). col has no end tag.'))
-    end
-
-    def endTagOther(name)
-        ignoreEndTag = ignoreEndTagColgroup
-        endTagColgroup('colgroup')
-        @parser.phase.processEndTag(name) unless ignoreEndTag
-    end
-end
-
-
-class InTableBodyPhase < Phase
-    # http://www.whatwg.org/specs/web-apps/current-work/#in-table0
-
-    handle_start [
-        ['html', :startTagHtml],
-        ['tr', :startTagTr],
-        [['td', 'th'], :startTagTableCell],
-        [['caption', 'col', 'colgroup', 'tbody', 'tfoot', 'thead'], :startTagTableOther]
-    ]
-
-    handle_end [
-        [['tbody', 'tfoot', 'thead'], :endTagTableRowGroup],
-        ['table', :endTagTable],
-        [['body', 'caption', 'col', 'colgroup', 'html', 'td', 'th', 'tr'], :endTagIgnore]
-    ]
-
-    # helper methods
-    def clearStackToTableBodyContext
-        until ['tbody', 'tfoot', 'thead', 'html'].include?(name = @tree.openElements[-1].name)
-            @parser.parseError(_("Unexpected implied end tag (#{name}) in the table body phase."))
-            @tree.openElements.pop
-        end
-    end
-
-    # the rest
-    def processCharacters(data)
-        @parser.phases[:inTable].processCharacters(data)
-    end
-
-    def startTagTr(name, attributes)
-        clearStackToTableBodyContext
-        @tree.insertElement(name, attributes)
-        @parser.phase = @parser.phases[:inRow]
-    end
-
-    def startTagTableCell(name, attributes)
-        @parser.parseError(_("Unexpected table cell start tag (#{name}) in the table body phase."))
-        startTagTr('tr', {})
-        @parser.phase.processStartTag(name, attributes)
-    end
-
-    def startTagTableOther(name, attributes)
-        # XXX AT Any ideas on how to share this with endTagTable?
-        if in_scope?('tbody', true) or in_scope?('thead', true) or in_scope?('tfoot', true)
-            clearStackToTableBodyContext
-            endTagTableRowGroup(@tree.openElements[-1].name)
-            @parser.phase.processStartTag(name, attributes)
-        else
-            # innerHTML case
-            @parser.parseError
-        end
-    end
-
-    def startTagOther(name, attributes)
-        @parser.phases[:inTable].processStartTag(name, attributes)
-    end
-
-    def endTagTableRowGroup(name)
-        if in_scope?(name, true)
-            clearStackToTableBodyContext
-            @tree.openElements.pop
-            @parser.phase = @parser.phases[:inTable]
-        else
-            @parser.parseError(_("Unexpected end tag (#{name}) in the table body phase. Ignored."))
-        end
-    end
-
-    def endTagTable(name)
-        if in_scope?('tbody', true) or in_scope?('thead', true) or in_scope?('tfoot', true)
-            clearStackToTableBodyContext
-            endTagTableRowGroup(@tree.openElements[-1].name)
-            @parser.phase.processEndTag(name)
-        else
-            # innerHTML case
-            @parser.parseError
-        end
-    end
-
-    def endTagIgnore(name)
-        @parser.parseError(_("Unexpected end tag (#{name}) in the table body phase. Ignored."))
-    end
-
-    def endTagOther(name)
-        @parser.phases[:inTable].processEndTag(name)
-    end
-end
-
-
-class InRowPhase < Phase
-    # http://www.whatwg.org/specs/web-apps/current-work/#in-row
-
-    handle_start [
-        ['html', :startTagHtml],
-        [['td', 'th'], :startTagTableCell],
-        [['caption', 'col', 'colgroup', 'tbody', 'tfoot', 'thead', 'tr'], :startTagTableOther]
-    ]
-
-    handle_end [
-        ['tr', :endTagTr],
-        ['table', :endTagTable],
-        [['tbody', 'tfoot', 'thead'], :endTagTableRowGroup],
-        [['body', 'caption', 'col', 'colgroup', 'html', 'td', 'th'], :endTagIgnore]
-    ]
-
-    # helper methods (XXX unify this with other table helper methods)
-    def clearStackToTableRowContext
-        until ['tr', 'html'].include?(name = @tree.openElements[-1].name)
-            @parser.parseError(_("Unexpected implied end tag (#{name}) in the row phase."))
-            @tree.openElements.pop
-        end
-    end
-
-    def ignoreEndTagTr
-        not in_scope?('tr', :tableVariant => true)
-    end
-
-    # the rest
-    def processCharacters(data)
-        @parser.phases[:inTable].processCharacters(data)
-    end
-
-    def startTagTableCell(name, attributes)
-        clearStackToTableRowContext
-        @tree.insertElement(name, attributes)
-        @parser.phase = @parser.phases[:inCell]
-        @tree.activeFormattingElements.push(Marker)
-    end
-
-    def startTagTableOther(name, attributes)
-        ignoreEndTag = ignoreEndTagTr
-        endTagTr('tr')
-        # XXX how are we sure it's always ignored in the innerHTML case?
-        @parser.phase.processStartTag(name, attributes) unless ignoreEndTag
-    end
-
-    def startTagOther(name, attributes)
-        @parser.phases[:inTable].processStartTag(name, attributes)
-    end
-
-    def endTagTr(name)
-        if ignoreEndTagTr
-            # innerHTML case
-            assert @parser.innerHTML
-            @parser.parseError
-        else
-            clearStackToTableRowContext
-            @tree.openElements.pop
-            @parser.phase = @parser.phases[:inTableBody]
-        end
-    end
-
-    def endTagTable(name)
-        ignoreEndTag = ignoreEndTagTr
-        endTagTr('tr')
-        # Reprocess the current tag if the tr end tag was not ignored
-        # XXX how are we sure it's always ignored in the innerHTML case?
-        @parser.phase.processEndTag(name) unless ignoreEndTag
-    end
-
-    def endTagTableRowGroup(name)
-        if in_scope?(name, true)
-            endTagTr('tr')
-            @parser.phase.processEndTag(name)
-        else
-            # innerHTML case
-            @parser.parseError
-        end
-    end
-
-    def endTagIgnore(name)
-        @parser.parseError(_("Unexpected end tag (#{name}) in the row phase. Ignored."))
-    end
-
-    def endTagOther(name)
-        @parser.phases[:inTable].processEndTag(name)
-    end
-end
-
-class InCellPhase < Phase
-    # http://www.whatwg.org/specs/web-apps/current-work/#in-cell
-
-    handle_start [
-        ['html', :startTagHtml],
-        [['caption', 'col', 'colgroup', 'tbody', 'td', 'tfoot', 'th', 'thead', 'tr'], :startTagTableOther]
-    ]
-
-    handle_end [
-        [['td', 'th'], :endTagTableCell],
-        [['body', 'caption', 'col', 'colgroup', 'html'], :endTagIgnore],
-        [['table', 'tbody', 'tfoot', 'thead', 'tr'], :endTagImply]
-    ]
-
-    # helper
-    def closeCell
-        if in_scope?('td', true)
-            endTagTableCell('td')
-        elsif in_scope?('th', true)
-            endTagTableCell('th')
-        end
-    end
-
-    # the rest
-    def processCharacters(data)
-        @parser.phases[:inBody].processCharacters(data)
-    end
-
-    def startTagTableOther(name, attributes)
-        if in_scope?('td', true) or in_scope?('th', true)
-            closeCell
-            @parser.phase.processStartTag(name, attributes)
-        else
-            # innerHTML case
-            @parser.parseError
-        end
-    end
-
-    def startTagOther(name, attributes)
-        @parser.phases[:inBody].processStartTag(name, attributes)
-    end
-
-    def endTagTableCell(name)
-        if in_scope?(name, true)
-            @tree.generateImpliedEndTags(name)
-            if @tree.openElements[-1].name != name
-                @parser.parseError("Got table cell end tag (#{name}) while required end tags are missing.")
-
-                remove_open_elements_until(name)
-            else
-                @tree.openElements.pop
-            end
-            @tree.clearActiveFormattingElements
-            @parser.phase = @parser.phases[:inRow]
-        else
-            @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
-        end
-    end
-
-    def endTagIgnore(name)
-        @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
-    end
-
-    def endTagImply(name)
-        if in_scope?(name, true)
-            closeCell
-            @parser.phase.processEndTag(name)
-        else
-            # sometimes innerHTML case
-            @parser.parseError
-        end
-    end
-
-    def endTagOther(name)
-        @parser.phases[:inBody].processEndTag(name)
-    end
-end
-
-
-class InSelectPhase < Phase
-    # http://www.whatwg.org/specs/web-apps/current-work/#in-select
-
-    handle_start [
-        ['html', :startTagHtml],
-        ['option', :startTagOption],
-        ['optgroup', :startTagOptgroup],
-        ['select', :startTagSelect]
-    ]
-
-    handle_end [
-        ['option', :endTagOption],
-        ['optgroup', :endTagOptgroup],
-        ['select', :endTagSelect],
-        [['caption', 'table', 'tbody', 'tfoot', 'thead', 'tr', 'td', 'th'], :endTagTableElements]
-    ]
-
-    def processCharacters(data)
-        @tree.insertText(data)
-    end
-
-    def startTagOption(name, attributes)
-        # We need to imply </option> if <option> is the current node.
-        @tree.openElements.pop if @tree.openElements[-1].name == 'option'
-        @tree.insertElement(name, attributes)
-    end
-
-    def startTagOptgroup(name, attributes)
-        @tree.openElements.pop if @tree.openElements[-1].name == 'option'
-        @tree.openElements.pop if @tree.openElements[-1].name == 'optgroup'
-        @tree.insertElement(name, attributes)
-    end
-
-    def startTagSelect(name, attributes)
-        @parser.parseError(_('Unexpected start tag (select) in the select phase implies select start tag.'))
-        endTagSelect('select')
-    end
-
-    def startTagOther(name, attributes)
-        @parser.parseError(_('Unexpected start tag token (#{name}) in the select phase. Ignored.'))
-    end
-
-    def endTagOption(name)
-        if @tree.openElements[-1].name == 'option'
-            @tree.openElements.pop
-        else
-            @parser.parseError(_('Unexpected end tag (option) in the select phase. Ignored.'))
-        end
-    end
-
-    def endTagOptgroup(name)
-        # </optgroup> implicitly closes <option>
-        if @tree.openElements[-1].name == 'option' and @tree.openElements[-2].name == 'optgroup'
-            @tree.openElements.pop
-        end
-        # It also closes </optgroup>
-        if @tree.openElements[-1].name == 'optgroup'
-            @tree.openElements.pop
-        # But nothing else
-        else
-            @parser.parseError(_('Unexpected end tag (optgroup) in the select phase. Ignored.'))
-        end
-    end
-
-    def endTagSelect(name)
-        if in_scope?('select', true)
-            remove_open_elements_until('select')
-
-            @parser.resetInsertionMode
-        else
-            # innerHTML case
-            @parser.parseError
-        end
-    end
-
-    def endTagTableElements(name)
-        @parser.parseError(_("Unexpected table end tag (#{name}) in the select phase."))
-
-        if in_scope?(name, true)
-            endTagSelect('select')
-            @parser.phase.processEndTag(name)
-        end
-    end
-
-    def endTagOther(name)
-        @parser.parseError(_("Unexpected end tag token (#{name}) in the select phase. Ignored."))
-    end
-end
-
-
-class AfterBodyPhase < Phase
-
-    handle_end [['html', :endTagHtml]]
-
-    def processComment(data)
-        # This is needed because data is to be appended to the <html> element
-        # here and not to whatever is currently open.
-        @tree.insertComment(data, @tree.openElements[0])
-    end
-
-    def processCharacters(data)
-        @parser.parseError(_('Unexpected non-space characters in the after body phase.'))
-        @parser.phase = @parser.phases[:inBody]
-        @parser.phase.processCharacters(data)
-    end
-
-    def processStartTag(name, attributes)
-        @parser.parseError(_("Unexpected start tag token (#{name}) in the after body phase."))
-        @parser.phase = @parser.phases[:inBody]
-        @parser.phase.processStartTag(name, attributes)
-    end
-
-    def endTagHtml(name)
-        if @parser.innerHTML
-            @parser.parseError
-        else
-            # XXX: This may need to be done, not sure
-            # Don't set lastPhase to the current phase but to the inBody phase
-            # instead. No need for extra parse errors if there's something after </html>.
-            # Try "<!doctype html>X</html>X" for instance.
-            @parser.lastPhase = @parser.phase
-            @parser.phase = @parser.phases[:trailingEnd]
-        end
-    end
-
-    def endTagOther(name)
-        @parser.parseError(_("Unexpected end tag token (#{name}) in the after body phase."))
-        @parser.phase = @parser.phases[:inBody]
-        @parser.phase.processEndTag(name)
-    end
-end
-
-class InFramesetPhase < Phase
-    # http://www.whatwg.org/specs/web-apps/current-work/#in-frameset
-
-    handle_start [
-        ['html', :startTagHtml],
-        ['frameset', :startTagFrameset],
-        ['frame', :startTagFrame],
-        ['noframes', :startTagNoframes]
-    ]
-
-    handle_end [
-        ['frameset', :endTagFrameset],
-        ['noframes', :endTagNoframes]
-    ]
-
-    def processCharacters(data)
-        @parser.parseError(_('Unexpected characters in the frameset phase. Characters ignored.'))
-    end
-
-    def startTagFrameset(name, attributes)
-        @tree.insertElement(name, attributes)
-    end
-
-    def startTagFrame(name, attributes)
-        @tree.insertElement(name, attributes)
-        @tree.openElements.pop
-    end
-
-    def startTagNoframes(name, attributes)
-        @parser.phases[:inBody].processStartTag(name, attributes)
-    end
-
-    def startTagOther(name, attributes)
-        @parser.parseError(_("Unexpected start tag token (#{name}) in the frameset phase. Ignored"))
-    end
-
-    def endTagFrameset(name)
-        if @tree.openElements[-1].name == 'html'
-            # innerHTML case
-            @parser.parseError(_("Unexpected end tag token (frameset) in the frameset phase (innerHTML)."))
-        else
-            @tree.openElements.pop
-        end
-        if (not @parser.innerHTML and
-            @tree.openElements[-1].name != 'frameset')
-            # If we're not in innerHTML mode and the the current node is not a
-            # "frameset" element (anymore) then switch.
-            @parser.phase = @parser.phases[:afterFrameset]
-        end
-    end
-
-    def endTagNoframes(name)
-        @parser.phases[:inBody].processEndTag(name)
-    end
-
-    def endTagOther(name)
-        @parser.parseError(_("Unexpected end tag token (#{name}) in the frameset phase. Ignored."))
-    end
-end
-
-
-class AfterFramesetPhase < Phase
-    # http://www.whatwg.org/specs/web-apps/current-work/#after3
-
-    handle_start [
-        ['html', :startTagHtml],
-        ['noframes', :startTagNoframes]
-    ]
-
-    handle_end [
-        ['html', :endTagHtml]
-    ]
-
-    def processCharacters(data)
-        @parser.parseError(_('Unexpected non-space characters in the after frameset phase. Ignored.'))
-    end
-
-    def startTagNoframes(name, attributes)
-        @parser.phases[:inBody].processStartTag(name, attributes)
-    end
-
-    def startTagOther(name, attributes)
-        @parser.parseError(_("Unexpected start tag (#{name}) in the after frameset phase. Ignored."))
-    end
-
-    def endTagHtml(name)
-        @parser.lastPhase = @parser.phase
-        @parser.phase = @parser.phases[:trailingEnd]
-    end
-
-    def endTagOther(name)
-        @parser.parseError(_("Unexpected end tag (#{name}) in the after frameset phase. Ignored."))
-    end
-end
-
-
-class TrailingEndPhase < Phase
-    def processEOF
-    end
-
-    def processComment(data)
-        @tree.insertComment(data, @tree.document)
-    end
-
-    def processSpaceCharacters(data)
-        @parser.lastPhase.processSpaceCharacters(data)
-    end
-
-    def processCharacters(data)
-        @parser.parseError(_('Unexpected non-space characters. Expected end of file.'))
-        @parser.phase = @parser.lastPhase
-        @parser.phase.processCharacters(data)
-    end
-
-    def processStartTag(name, attributes)
-        @parser.parseError(_('Unexpected start tag (#{name}). Expected end of file.'))
-        @parser.phase = @parser.lastPhase
-        @parser.phase.processStartTag(name, attributes)
-    end
-
-    def processEndTag(name)
-        @parser.parseError(_('Unexpected end tag (#{name}). Expected end of file.'))
-        @parser.phase = @parser.lastPhase
-        @parser.phase.processEndTag(name)
-    end
-end
-
-
-# Error in parsed document
-class ParseError < Exception; end
-class AssertionError < Exception; end
+  end
 
 end
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/after_body_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/after_body_phase.rb
new file mode 100644
index 00000000..27778ef1
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/after_body_phase.rb
@@ -0,0 +1,46 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class AfterBodyPhase < Phase
+
+    handle_end 'html'
+
+    def processComment(data)
+      # This is needed because data is to be appended to the <html> element
+      # here and not to whatever is currently open.
+      @tree.insertComment(data, @tree.openElements[0])
+    end
+
+    def processCharacters(data)
+      @parser.parseError(_('Unexpected non-space characters in the after body phase.'))
+      @parser.phase = @parser.phases[:inBody]
+      @parser.phase.processCharacters(data)
+    end
+
+    def processStartTag(name, attributes)
+      @parser.parseError(_("Unexpected start tag token (#{name}) in the after body phase."))
+      @parser.phase = @parser.phases[:inBody]
+      @parser.phase.processStartTag(name, attributes)
+    end
+
+    def endTagHtml(name)
+      if @parser.innerHTML
+        @parser.parseError
+      else
+        # XXX: This may need to be done, not sure
+        # Don't set lastPhase to the current phase but to the inBody phase
+        # instead. No need for extra parse errors if there's something after </html>.
+        # Try "<!doctype html>X</html>X" for instance.
+        @parser.lastPhase = @parser.phase
+        @parser.phase = @parser.phases[:trailingEnd]
+      end
+    end
+
+    def endTagOther(name)
+      @parser.parseError(_("Unexpected end tag token (#{name}) in the after body phase."))
+      @parser.phase = @parser.phases[:inBody]
+      @parser.phase.processEndTag(name)
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/after_frameset_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/after_frameset_phase.rb
new file mode 100644
index 00000000..376c5f38
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/after_frameset_phase.rb
@@ -0,0 +1,34 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class AfterFramesetPhase < Phase
+
+    # http://www.whatwg.org/specs/web-apps/current-work/#after3
+
+    handle_start 'html', 'noframes'
+
+    handle_end 'html'
+
+    def processCharacters(data)
+      @parser.parseError(_('Unexpected non-space characters in the after frameset phase. Ignored.'))
+    end
+
+    def startTagNoframes(name, attributes)
+      @parser.phases[:inBody].processStartTag(name, attributes)
+    end
+
+    def startTagOther(name, attributes)
+      @parser.parseError(_("Unexpected start tag (#{name}) in the after frameset phase. Ignored."))
+    end
+
+    def endTagHtml(name)
+      @parser.lastPhase = @parser.phase
+      @parser.phase = @parser.phases[:trailingEnd]
+    end
+
+    def endTagOther(name)
+      @parser.parseError(_("Unexpected end tag (#{name}) in the after frameset phase. Ignored."))
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/after_head_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/after_head_phase.rb
new file mode 100644
index 00000000..37c8bf6b
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/after_head_phase.rb
@@ -0,0 +1,50 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class AfterHeadPhase < Phase
+  
+    handle_start 'html', 'body', 'frameset', %w( base link meta script style title ) => 'FromHead'
+
+    def processEOF
+      anythingElse
+      @parser.phase.processEOF
+    end
+
+    def processCharacters(data)
+      anythingElse
+      @parser.phase.processCharacters(data)
+    end
+
+    def startTagBody(name, attributes)
+      @tree.insertElement(name, attributes)
+      @parser.phase = @parser.phases[:inBody]
+    end
+
+    def startTagFrameset(name, attributes)
+      @tree.insertElement(name, attributes)
+      @parser.phase = @parser.phases[:inFrameset]
+    end
+
+    def startTagFromHead(name, attributes)
+      @parser.parseError(_("Unexpected start tag (#{name}) that can be in head. Moved."))
+      @parser.phase = @parser.phases[:inHead]
+      @parser.phase.processStartTag(name, attributes)
+    end
+
+    def startTagOther(name, attributes)
+      anythingElse
+      @parser.phase.processStartTag(name, attributes)
+    end
+
+    def processEndTag(name)
+      anythingElse
+      @parser.phase.processEndTag(name)
+    end
+
+    def anythingElse
+      @tree.insertElement('body', {})
+      @parser.phase = @parser.phases[:inBody]
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/before_head_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/before_head_phase.rb
new file mode 100644
index 00000000..87b301a2
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/before_head_phase.rb
@@ -0,0 +1,41 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class BeforeHeadPhase < Phase
+
+    handle_start 'html', 'head'
+
+    handle_end 'html'
+
+    def processEOF
+      startTagHead('head', {})
+      @parser.phase.processEOF
+    end
+
+    def processCharacters(data)
+      startTagHead('head', {})
+      @parser.phase.processCharacters(data)
+    end
+
+    def startTagHead(name, attributes)
+      @tree.insertElement(name, attributes)
+      @tree.headPointer = @tree.openElements[-1]
+      @parser.phase = @parser.phases[:inHead]
+    end
+
+    def startTagOther(name, attributes)
+      startTagHead('head', {})
+      @parser.phase.processStartTag(name, attributes)
+    end
+
+    def endTagHtml(name)
+      startTagHead('head', {})
+      @parser.phase.processEndTag(name)
+    end
+
+    def endTagOther(name)
+      @parser.parseError(_("Unexpected end tag (#{name}) after the (implied) root element."))
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_body_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_body_phase.rb
new file mode 100644
index 00000000..ca6c8cd3
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_body_phase.rb
@@ -0,0 +1,548 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class InBodyPhase < Phase
+
+    # http://www.whatwg.org/specs/web-apps/current-work/#in-body
+
+    handle_start 'html', 'body', 'form', 'plaintext', 'a', 'button', 'xmp', 'table', 'hr', 'image'
+
+    handle_start 'input', 'textarea', 'select', 'isindex', %w( script style ), %w( marquee object )
+
+    handle_start %w( li dd dt ) => 'ListItem', %w( base link meta title ) => 'FromHead'
+      
+    handle_start %w( address blockquote center dir div dl fieldset listing menu ol p pre ul ) => 'CloseP'
+
+    handle_start %w( b big em font i nobr s small strike strong tt u ) => 'Formatting'
+
+    handle_start %w( area basefont bgsound br embed img param spacer wbr ) => 'VoidFormatting'
+
+    handle_start %w( iframe noembed noframes noscript ) => 'Cdata', HEADING_ELEMENTS => 'Heading'
+
+    handle_start %w( caption col colgroup frame frameset head option optgroup tbody td tfoot th thead tr ) => 'Misplaced'
+
+    handle_start %w( event-source section nav article aside header footer datagrid command ) => 'New'
+
+    handle_end 'p', 'body', 'html', 'form', %w( button marquee object ), %w( dd dt li ) => 'ListItem'
+
+    handle_end %w( address blockquote center div dl fieldset listing menu ol pre ul ) => 'Block'
+
+    handle_end %w( a b big em font i nobr s small strike strong tt u ) => 'Formatting'
+
+    handle_end %w( head frameset select optgroup option table caption colgroup col thead tfoot tbody tr td th ) => 'Misplaced' 
+
+    handle_end %w( area basefont bgsound br embed hr image img input isindex param spacer wbr frame ) => 'None'
+
+    handle_end %w( noframes noscript noembed textarea xmp iframe ) => 'CdataTextAreaXmp'
+
+    handle_end %w( event-source section nav article aside header footer datagrid command ) => 'New'
+
+    def initialize(parser, tree)
+      super(parser, tree)
+
+      # for special handling of whitespace in <pre>
+      @processSpaceCharactersPre = false
+    end
+
+    def processSpaceCharactersPre(data)
+      #Sometimes (start of <pre> blocks) we want to drop leading newlines
+      @processSpaceCharactersPre = false
+      if (data.length > 0 and data[0] == ?\n and 
+        @tree.openElements[-1].name == 'pre' and
+        not @tree.openElements[-1].hasContent)
+        data = data[1..-1]
+      end
+      @tree.insertText(data) if data.length > 0
+    end
+
+    def processSpaceCharacters(data)
+      if @processSpaceCharactersPre
+        processSpaceCharactersPre(data)
+      else
+        super(data)
+      end
+    end
+
+    def processCharacters(data)
+      # XXX The specification says to do this for every character at the
+      # moment, but apparently that doesn't match the real world so we don't
+      # do it for space characters.
+      @tree.reconstructActiveFormattingElements
+      @tree.insertText(data)
+    end
+
+    def startTagScriptStyle(name, attributes)
+      @parser.phases[:inHead].processStartTag(name, attributes)
+    end
+
+    def startTagFromHead(name, attributes)
+      @parser.parseError(_("Unexpected start tag (#{name}) that belongs in the head. Moved."))
+      @parser.phases[:inHead].processStartTag(name, attributes)
+    end
+
+    def startTagBody(name, attributes)
+      @parser.parseError(_('Unexpected start tag (body).'))
+
+      if (@tree.openElements.length == 1 or
+        @tree.openElements[1].name != 'body')
+        assert @parser.innerHTML
+      else
+        attributes.each do |attr, value|
+          unless @tree.openElements[1].attributes.has_key?(attr)
+            @tree.openElements[1].attributes[attr] = value
+          end
+        end
+      end
+    end
+
+    def startTagCloseP(name, attributes)
+      endTagP('p') if in_scope?('p')
+      @tree.insertElement(name, attributes)
+      @processSpaceCharactersPre = true if name == 'pre'
+    end
+
+    def startTagForm(name, attributes)
+      if @tree.formPointer # a form pointer is already set: report the tag and drop it
+        @parser.parseError(_('Unexpected start tag (form). Ignored.'))
+      else
+        endTagP('p') if in_scope?('p')
+        @tree.insertElement(name, attributes)
+        @tree.formPointer = @tree.openElements[-1] # point at the current last open element
+      end
+    end
+
+    def startTagListItem(name, attributes)
+      endTagP('p') if in_scope?('p')
+      stopNames = {'li' => ['li'], 'dd' => ['dd', 'dt'], 'dt' => ['dd', 'dt']}
+      stopName = stopNames[name]
+
+      @tree.openElements.reverse.each_with_index do |node, i|
+        if stopName.include?(node.name)
+          (i + 1).times { @tree.openElements.pop }
+          break
+        end
+
+        # Phrasing elements are all non special, non scoping, non
+        # formatting elements
+        break if ((SPECIAL_ELEMENTS + SCOPING_ELEMENTS).include?(node.name) and
+          not ['address', 'div'].include?(node.name))
+      end
+
+      # Always insert an <li> element.
+      @tree.insertElement(name, attributes)
+    end
+
+    def startTagPlaintext(name, attributes)
+      endTagP('p') if in_scope?('p')
+      @tree.insertElement(name, attributes)
+      @parser.tokenizer.contentModelFlag = :PLAINTEXT
+    end
+
+    def startTagHeading(name, attributes)
+      endTagP('p') if in_scope?('p')
+      HEADING_ELEMENTS.each do |heading|
+        if in_scope?(heading)
+          @parser.parseError(_("Unexpected start tag (#{name})."))
+          # Distinct block parameter name: the original reused the loop variable's name.
+          remove_open_elements_until { |open_element| HEADING_ELEMENTS.include?(open_element.name) }
+
+          break
+        end
+      end
+      @tree.insertElement(name, attributes)
+    end
+
+    def startTagA(name, attributes)
+      if afeAElement = @tree.elementInActiveFormattingElements('a')
+        @parser.parseError(_('Unexpected start tag (a) implies end tag (a).'))
+        endTagFormatting('a')
+        @tree.openElements.delete(afeAElement) if @tree.openElements.include?(afeAElement)
+        @tree.activeFormattingElements.delete(afeAElement) if @tree.activeFormattingElements.include?(afeAElement)
+      end
+      @tree.reconstructActiveFormattingElements
+      addFormattingElement(name, attributes)
+    end
+
+    def startTagFormatting(name, attributes)
+      @tree.reconstructActiveFormattingElements
+      addFormattingElement(name, attributes)
+    end
+
+    def startTagButton(name, attributes)
+      if in_scope?('button')
+        @parser.parseError(_('Unexpected start tag (button) implied end tag (button).'))
+        processEndTag('button')
+        @parser.phase.processStartTag(name, attributes)
+      else
+        @tree.reconstructActiveFormattingElements
+        @tree.insertElement(name, attributes)
+        @tree.activeFormattingElements.push(Marker)
+      end
+    end
+
+    def startTagMarqueeObject(name, attributes)
+      @tree.reconstructActiveFormattingElements
+      @tree.insertElement(name, attributes)
+      @tree.activeFormattingElements.push(Marker)
+    end
+
+    def startTagXmp(name, attributes)
+      @tree.reconstructActiveFormattingElements
+      @tree.insertElement(name, attributes)
+      @parser.tokenizer.contentModelFlag = :CDATA
+    end
+
+    def startTagTable(name, attributes)
+      processEndTag('p') if in_scope?('p')
+      @tree.insertElement(name, attributes)
+      @parser.phase = @parser.phases[:inTable]
+    end
+
+    def startTagVoidFormatting(name, attributes)
+      @tree.reconstructActiveFormattingElements
+      @tree.insertElement(name, attributes)
+      @tree.openElements.pop
+    end
+
+    def startTagHr(name, attributes)
+      endTagP('p') if in_scope?('p')
+      @tree.insertElement(name, attributes)
+      @tree.openElements.pop
+    end
+
+    def startTagImage(name, attributes)
+      # No really...
+      @parser.parseError(_('Unexpected start tag (image). Treated as img.'))
+      processStartTag('img', attributes)
+    end
+
+    def startTagInput(name, attributes)
+      @tree.reconstructActiveFormattingElements
+      @tree.insertElement(name, attributes)
+      if @tree.formPointer
+        # XXX Not exactly sure what to do here
+        # @tree.openElements[-1].form = @tree.formPointer
+      end
+      @tree.openElements.pop
+    end
+
+    def startTagIsindex(name, attributes)
+      @parser.parseError(_("Unexpected start tag isindex. Don't use it!"))
+      return if @tree.formPointer
+      processStartTag('form', {})
+      processStartTag('hr', {})
+      processStartTag('p', {})
+      processStartTag('label', {})
+      # XXX Localization ...
+      processCharacters('This is a searchable index. Insert your search keywords here:')
+      input_attributes = attributes.dup # copy so the caller's attributes are not mutated
+      input_attributes['name'] = 'isindex'
+      processStartTag('input', input_attributes)
+      processEndTag('label')
+      processEndTag('p')
+      processStartTag('hr', {})
+      processEndTag('form')
+    end
+
+    def startTagTextarea(name, attributes)
+      # XXX Form element pointer checking here as well...
+      @tree.insertElement(name, attributes)
+      @parser.tokenizer.contentModelFlag = :RCDATA
+    end
+
+    # iframe, noembed, noframes, noscript (if scripting enabled)
+    def startTagCdata(name, attributes)
+      @tree.insertElement(name, attributes)
+      @parser.tokenizer.contentModelFlag = :CDATA
+    end
+
+    def startTagSelect(name, attributes)
+      @tree.reconstructActiveFormattingElements
+      @tree.insertElement(name, attributes)
+      @parser.phase = @parser.phases[:inSelect]
+    end
+
+    def startTagMisplaced(name, attributes)
+      # Elements that should be children of other elements that have a
+      # different insertion mode; here they are ignored
+      # "caption", "col", "colgroup", "frame", "frameset", "head",
+      # "option", "optgroup", "tbody", "td", "tfoot", "th", "thead",
+      # "tr", "noscript"
+      @parser.parseError(_("Unexpected start tag (#{name}). Ignored."))
+    end
+
+    def startTagNew(name, attributes)
+      # New HTML5 elements, "event-source", "section", "nav",
+      # "article", "aside", "header", "footer", "datagrid", "command"
+      $stderr.puts("Warning: Undefined behaviour for start tag #{name}")
+      startTagOther(name, attributes)
+      #raise NotImplementedError
+    end
+
+    def startTagOther(name, attributes)
+      @tree.reconstructActiveFormattingElements
+      @tree.insertElement(name, attributes)
+    end
+
+    def endTagP(name)
+      @tree.generateImpliedEndTags('p') if in_scope?('p')
+      @parser.parseError('Unexpected end tag (p).') unless @tree.openElements[-1].name == 'p'
+      @tree.openElements.pop while in_scope?('p')
+    end
+
+    def endTagBody(name)
+      # XXX Need to take open <p> tags into account here. We shouldn't imply
+      # </p> but we should not throw a parse error either. Specification is
+      # likely to be updated.
+      if @tree.openElements.length < 2 or @tree.openElements[1].name != 'body'
+        # innerHTML case (the length check avoids calling .name on nil)
+        @parser.parseError
+        return
+      end
+      unless @tree.openElements[-1].name == 'body'
+        @parser.parseError(_("Unexpected end tag (body). Missing end tag (#{@tree.openElements[-1].name})."))
+      end
+      @parser.phase = @parser.phases[:afterBody]
+    end
+
+    def endTagHtml(name)
+      endTagBody(name)
+      @parser.phase.processEndTag(name) unless @parser.innerHTML
+    end
+
+    def endTagBlock(name)
+      # Put us back in the right whitespace handling mode
+      @processSpaceCharactersPre = false if name == 'pre'
+
+      @tree.generateImpliedEndTags if in_scope?(name)
+
+      unless @tree.openElements[-1].name == name
+        @parser.parseError(_("End tag (#{name}) seen too early. Expected other end tag."))
+      end
+
+      if in_scope?(name)
+        remove_open_elements_until(name)
+      end
+    end
+
+    def endTagForm(name)
+      endTagBlock(name)
+      @tree.formPointer = nil
+    end
+
+    def endTagListItem(name)
+      # AT Could merge this with the Block case
+      if in_scope?(name)
+        @tree.generateImpliedEndTags(name)
+
+        unless @tree.openElements[-1].name == name
+          @parser.parseError(_("End tag (#{name}) seen too early. Expected other end tag."))
+        end
+      end
+
+      remove_open_elements_until(name) if in_scope?(name)
+    end
+
+    def endTagHeading(name)
+      HEADING_ELEMENTS.each do |heading|
+        if in_scope?(heading)
+          @tree.generateImpliedEndTags
+          break
+        end
+      end
+
+      unless @tree.openElements[-1].name == name
+        @parser.parseError(_("Unexpected end tag (#{name}). Expected other end tag."))
+      end
+
+      HEADING_ELEMENTS.each do |heading|
+        if in_scope?(heading)
+          remove_open_elements_until { |open_element| HEADING_ELEMENTS.include?(open_element.name) }
+          break
+        end
+      end
+    end
+
+    # The much-feared adoption agency algorithm
+    def endTagFormatting(name)
+      # http://www.whatwg.org/specs/web-apps/current-work/#adoptionAgency
+      # XXX Better parseError messages appreciated.
+      while true
+        # Step 1 paragraph 1
+        afeElement = @tree.elementInActiveFormattingElements(name)
+        if not afeElement or (@tree.openElements.include?(afeElement) and not in_scope?(afeElement.name))
+          @parser.parseError(_("End tag (#{name}) violates step 1, paragraph 1 of the adoption agency algorithm."))
+          return
+        # Step 1 paragraph 2
+        elsif not @tree.openElements.include?(afeElement)
+          @parser.parseError(_("End tag (#{name}) violates step 1, paragraph 2 of the adoption agency algorithm."))
+          @tree.activeFormattingElements.delete(afeElement)
+          return
+        end
+
+        # Step 1 paragraph 3
+        if afeElement != @tree.openElements[-1]
+          @parser.parseError(_("End tag (#{name}) violates step 1, paragraph 3 of the adoption agency algorithm."))
+        end
+
+        # Step 2
+        # Start of the adoption agency algorithm proper
+        afeIndex = @tree.openElements.index(afeElement)
+        furthestBlock = nil
+        @tree.openElements[afeIndex..-1].each do |element|
+          if (SPECIAL_ELEMENTS + SCOPING_ELEMENTS).include?(element.name)
+            furthestBlock = element
+            break
+          end
+        end
+
+        # Step 3
+        if furthestBlock.nil?
+          element = remove_open_elements_until { |element| element == afeElement }
+          @tree.activeFormattingElements.delete(element)
+          return
+        end
+        commonAncestor = @tree.openElements[afeIndex - 1]
+
+        # Step 5
+        furthestBlock.parent.removeChild(furthestBlock) if furthestBlock.parent
+
+        # Step 6
+        # The bookmark is supposed to help us identify where to reinsert
+        # nodes in step 12. We have to ensure that we reinsert nodes after
+        # the node before the active formatting element. Note the bookmark
+        # can move in step 7.4
+        bookmark = @tree.activeFormattingElements.index(afeElement)
+
+        # Step 7
+        lastNode = node = furthestBlock
+        while true
+          # AT replace this with a function and recursion?
+          # Node is element before node in open elements
+          node = @tree.openElements[@tree.openElements.index(node) - 1]
+          until @tree.activeFormattingElements.include?(node)
+            tmpNode = node
+            node = @tree.openElements[@tree.openElements.index(node) - 1]
+            @tree.openElements.delete(tmpNode)
+          end
+          # Step 7.3
+          break if node == afeElement
+          # Step 7.4
+          if lastNode == furthestBlock
+            # XXX should this be index(node) or index(node)+1
+            # Anne: I think +1 is ok. Given x = [2,3,4,5]
+            # x.index(3) gives 1 and then x[1 +1] gives 4...
+            bookmark = @tree.activeFormattingElements.index(node) + 1
+          end
+          # Step 7.5
+          cite = node.parent
+          if node.hasContent
+            clone = node.cloneNode
+            # Replace node with clone
+            @tree.activeFormattingElements[@tree.activeFormattingElements.index(node)] = clone
+            @tree.openElements[@tree.openElements.index(node)] = clone
+            node = clone
+          end
+          # Step 7.6
+          # Remove lastNode from its parents, if any
+          lastNode.parent.removeChild(lastNode) if lastNode.parent
+          node.appendChild(lastNode)
+          # Step 7.7
+          lastNode = node
+          # End of inner loop
+        end
+
+        # Step 8
+        lastNode.parent.removeChild(lastNode) if lastNode.parent
+        commonAncestor.appendChild(lastNode)
+
+        # Step 9
+        clone = afeElement.cloneNode
+
+        # Step 10
+        furthestBlock.reparentChildren(clone)
+
+        # Step 11
+        furthestBlock.appendChild(clone)
+
+        # Step 12
+        @tree.activeFormattingElements.delete(afeElement)
+        @tree.activeFormattingElements.insert([bookmark,@tree.activeFormattingElements.length].min, clone)
+
+        # Step 13
+        @tree.openElements.delete(afeElement)
+        @tree.openElements.insert(@tree.openElements.index(furthestBlock) + 1, clone)
+      end
+    end
+
+    def endTagButtonMarqueeObject(name)
+      @tree.generateImpliedEndTags if in_scope?(name)
+
+      unless @tree.openElements[-1].name == name
+        @parser.parseError(_("Unexpected end tag (#{name}). Expected other end tag first."))
+      end
+
+      if in_scope?(name)
+        remove_open_elements_until(name)
+      
+        @tree.clearActiveFormattingElements
+      end
+    end
+
+    def endTagMisplaced(name)
+      # Handles elements whose end tags belong to other insertion modes: report only.
+      @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
+    end
+
+    def endTagNone(name)
+      # Handles elements with no end tag: the stray end tag is only reported.
+      @parser.parseError(_("This tag (#{name}) has no end tag"))
+    end
+
+    def endTagCdataTextAreaXmp(name)
+      if @tree.openElements[-1].name == name
+        @tree.openElements.pop
+      else
+        @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
+      end
+    end
+
+    def endTagNew(name)
+      # New HTML5 elements, "event-source", "section", "nav",
+      # "article", "aside", "header", "footer", "datagrid", "command"
+      STDERR.puts "Warning: Undefined behaviour for end tag #{name}"
+      endTagOther(name)
+      #raise NotImplementedError
+    end
+
+    def endTagOther(name)
+      # XXX This logic should be moved into the treebuilder
+      @tree.openElements.reverse.each do |node|
+        if node.name == name
+          @tree.generateImpliedEndTags
+
+          unless @tree.openElements[-1].name == name
+            @parser.parseError(_("Unexpected end tag (#{name})."))
+          end
+
+          remove_open_elements_until { |element| element == node }
+
+          break
+        else
+          if (SPECIAL_ELEMENTS + SCOPING_ELEMENTS).include?(node.name)
+            @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
+            break
+          end
+        end
+      end
+    end
+
+    protected
+
+    def addFormattingElement(name, attributes) # insert, then track as an active formatting element
+      @tree.insertElement(name, attributes)
+      @tree.activeFormattingElements.push(@tree.openElements[-1]) # presumably the element just inserted; verify insertElement
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_caption_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_caption_phase.rb
new file mode 100644
index 00000000..ccdfcb91
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_caption_phase.rb
@@ -0,0 +1,68 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class InCaptionPhase < Phase
+
+    # http://www.whatwg.org/specs/web-apps/current-work/#in-caption
+
+    handle_start 'html', %w( caption col colgroup tbody td tfoot th thead tr ) => 'TableElement'
+
+    handle_end 'caption', 'table', %w( body col colgroup html tbody td tfoot th thead tr ) => 'Ignore'
+
+    def ignoreEndTagCaption
+      not in_scope?('caption', true)
+    end
+
+    def processCharacters(data)
+      @parser.phases[:inBody].processCharacters(data)
+    end
+
+    def startTagTableElement(name, attributes)
+      @parser.parseError
+      #XXX Have to duplicate logic here to find out if the tag is ignored
+      ignoreEndTag = ignoreEndTagCaption
+      @parser.phase.processEndTag('caption')
+      @parser.phase.processStartTag(name, attributes) unless ignoreEndTag
+    end
+
+    def startTagOther(name, attributes)
+      @parser.phases[:inBody].processStartTag(name, attributes)
+    end
+
+    def endTagCaption(name)
+      if ignoreEndTagCaption
+        # innerHTML case
+        assert @parser.innerHTML
+        @parser.parseError
+      else
+        # AT this code is quite similar to endTagTable in "InTable"
+        @tree.generateImpliedEndTags
+
+        unless @tree.openElements[-1].name == 'caption'
+          @parser.parseError(_("Unexpected end tag (caption). Missing end tags."))
+        end
+
+        remove_open_elements_until('caption')
+
+        @tree.clearActiveFormattingElements
+        @parser.phase = @parser.phases[:inTable]
+      end
+    end
+
+    def endTagTable(name)
+      @parser.parseError
+      ignoreEndTag = ignoreEndTagCaption
+      @parser.phase.processEndTag('caption')
+      @parser.phase.processEndTag(name) unless ignoreEndTag
+    end
+
+    def endTagIgnore(name)
+      @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
+    end
+
+    def endTagOther(name)
+      @parser.phases[:inBody].processEndTag(name)
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_cell_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_cell_phase.rb
new file mode 100644
index 00000000..5b88a30b
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_cell_phase.rb
@@ -0,0 +1,78 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class InCellPhase < Phase
+
+    # http://www.whatwg.org/specs/web-apps/current-work/#in-cell
+
+    handle_start 'html', %w( caption col colgroup tbody td tfoot th thead tr ) => 'TableOther'
+
+    handle_end %w( td th ) => 'TableCell', %w( body caption col colgroup html ) => 'Ignore'
+
+    handle_end %w( table tbody tfoot thead tr ) => 'Imply'
+
+    def processCharacters(data)
+      @parser.phases[:inBody].processCharacters(data)
+    end
+
+    def startTagTableOther(name, attributes)
+      if in_scope?('td', true) or in_scope?('th', true)
+        closeCell
+        @parser.phase.processStartTag(name, attributes)
+      else
+        # innerHTML case
+        @parser.parseError
+      end
+    end
+
+    def startTagOther(name, attributes)
+      @parser.phases[:inBody].processStartTag(name, attributes)
+    end
+
+    def endTagTableCell(name)
+      if in_scope?(name, true)
+        @tree.generateImpliedEndTags(name)
+        if @tree.openElements[-1].name != name
+          @parser.parseError("Got table cell end tag (#{name}) while required end tags are missing.")
+
+          remove_open_elements_until(name)
+        else
+          @tree.openElements.pop
+        end
+        @tree.clearActiveFormattingElements
+        @parser.phase = @parser.phases[:inRow]
+      else
+        @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
+      end
+    end
+
+    def endTagIgnore(name)
+      @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
+    end
+
+    def endTagImply(name)
+      if in_scope?(name, true)
+        closeCell
+        @parser.phase.processEndTag(name)
+      else
+        # sometimes innerHTML case
+        @parser.parseError
+      end
+    end
+
+    def endTagOther(name)
+      @parser.phases[:inBody].processEndTag(name)
+    end
+
+    protected
+
+    def closeCell
+      if in_scope?('td', true)
+        endTagTableCell('td')
+      elsif in_scope?('th', true)
+        endTagTableCell('th')
+      end
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_column_group_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_column_group_phase.rb
new file mode 100644
index 00000000..7729eb83
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_column_group_phase.rb
@@ -0,0 +1,55 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class InColumnGroupPhase < Phase
+
+    # http://www.whatwg.org/specs/web-apps/current-work/#in-column
+
+    handle_start 'html', 'col'
+
+    handle_end 'colgroup', 'col'
+
+    def ignoreEndTagColgroup
+      @tree.openElements[-1].name == 'html'
+    end
+
+    def processCharacters(data)
+      ignoreEndTag = ignoreEndTagColgroup
+      endTagColgroup("colgroup")
+      @parser.phase.processCharacters(data) unless ignoreEndTag
+    end
+
+    def startTagCol(name, attributes)
+      @tree.insertElement(name, attributes)
+      @tree.openElements.pop
+    end
+
+    def startTagOther(name, attributes)
+      ignoreEndTag = ignoreEndTagColgroup
+      endTagColgroup('colgroup')
+      @parser.phase.processStartTag(name, attributes) unless ignoreEndTag
+    end
+
+    def endTagColgroup(name)
+      if ignoreEndTagColgroup
+        # innerHTML case
+        assert @parser.innerHTML
+        @parser.parseError
+      else
+        @tree.openElements.pop
+        @parser.phase = @parser.phases[:inTable]
+      end
+    end
+
+    def endTagCol(name)
+      @parser.parseError(_('Unexpected end tag (col). col has no end tag.'))
+    end
+
+    def endTagOther(name)
+      ignoreEndTag = ignoreEndTagColgroup
+      endTagColgroup('colgroup')
+      @parser.phase.processEndTag(name) unless ignoreEndTag
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_frameset_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_frameset_phase.rb
new file mode 100644
index 00000000..d6c7400c
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_frameset_phase.rb
@@ -0,0 +1,57 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class InFramesetPhase < Phase
+
+    # http://www.whatwg.org/specs/web-apps/current-work/#in-frameset
+
+    handle_start 'html', 'frameset', 'frame', 'noframes'
+
+    handle_end 'frameset', 'noframes'
+
+    def processCharacters(data)
+      @parser.parseError(_('Unexpected characters in the frameset phase. Characters ignored.'))
+    end
+
+    def startTagFrameset(name, attributes)
+      @tree.insertElement(name, attributes)
+    end
+
+    def startTagFrame(name, attributes)
+      @tree.insertElement(name, attributes)
+      @tree.openElements.pop
+    end
+
+    def startTagNoframes(name, attributes)
+      @parser.phases[:inBody].processStartTag(name, attributes)
+    end
+
+    def startTagOther(name, attributes)
+      @parser.parseError(_("Unexpected start tag token (#{name}) in the frameset phase. Ignored"))
+    end
+
+    def endTagFrameset(name)
+      if @tree.openElements[-1].name == 'html'
+        # innerHTML case
+        @parser.parseError(_("Unexpected end tag token (frameset) in the frameset phase (innerHTML)."))
+      else
+        @tree.openElements.pop
+      end
+      if (not @parser.innerHTML and
+        @tree.openElements[-1].name != 'frameset')
+        # If we're not in innerHTML mode and the the current node is not a
+        # "frameset" element (anymore) then switch.
+        @parser.phase = @parser.phases[:afterFrameset]
+      end
+    end
+
+    def endTagNoframes(name)
+      @parser.phases[:inBody].processEndTag(name)
+    end
+
+    def endTagOther(name)
+      @parser.parseError(_("Unexpected end tag token (#{name}) in the frameset phase. Ignored."))
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_head_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_head_phase.rb
new file mode 100644
index 00000000..4060114a
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_head_phase.rb
@@ -0,0 +1,120 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class InHeadPhase < Phase
+
+    handle_start 'html', 'head', 'title', 'style', 'script', %w( base link meta )
+
+    handle_end 'head', 'html', %w( title style script )
+
+    def processEOF
+      if ['title', 'style', 'script'].include?(name = @tree.openElements[-1].name)
+        @parser.parseError(_("Unexpected end of file. Expected end tag (#{name})."))
+        @tree.openElements.pop
+      end
+      anythingElse
+      @parser.phase.processEOF
+    end
+
+    def processCharacters(data)
+      if ['title', 'style', 'script'].include?(@tree.openElements[-1].name)
+        @tree.insertText(data)
+      else
+        anythingElse
+        @parser.phase.processCharacters(data)
+      end
+    end
+
+    def startTagHead(name, attributes)
+      @parser.parseError(_('Unexpected start tag head in existing head. Ignored'))
+    end
+
+    def startTagTitle(name, attributes)
+      element = @tree.createElement(name, attributes)
+      appendToHead(element)
+      @tree.openElements.push(element)
+      @parser.tokenizer.contentModelFlag = :RCDATA
+    end
+
+    def startTagStyle(name, attributes)
+      element = @tree.createElement(name, attributes)
+      if @tree.headPointer != nil and @parser.phase == @parser.phases[:inHead]
+        appendToHead(element)
+      else
+        @tree.openElements[-1].appendChild(element)
+      end
+      @tree.openElements.push(element)
+      @parser.tokenizer.contentModelFlag = :CDATA
+    end
+
+    def startTagScript(name, attributes)
+      #XXX Inner HTML case may be wrong
+      element = @tree.createElement(name, attributes)
+      element._flags.push("parser-inserted")
+      if (@tree.headPointer != nil and
+        @parser.phase == @parser.phases[:inHead])
+        appendToHead(element)
+      else
+        @tree.openElements[-1].appendChild(element)
+      end
+      @tree.openElements.push(element)
+      @parser.tokenizer.contentModelFlag = :CDATA
+    end
+
+    def startTagBaseLinkMeta(name, attributes)
+      element = @tree.createElement(name, attributes)
+      appendToHead(element)
+    end
+
+    def startTagOther(name, attributes)
+      anythingElse
+      @parser.phase.processStartTag(name, attributes)
+    end
+
+    def endTagHead(name)
+      if @tree.openElements[-1].name == 'head'
+        @tree.openElements.pop
+      else
+        @parser.parseError(_("Unexpected end tag (head). Ignored."))
+      end
+      @parser.phase = @parser.phases[:afterHead]
+    end
+
+    def endTagHtml(name)
+      anythingElse
+      @parser.phase.processEndTag(name)
+    end
+
+    def endTagTitleStyleScript(name)
+      if @tree.openElements[-1].name == name
+        @tree.openElements.pop
+      else
+        @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
+      end
+    end
+
+    def endTagOther(name)
+      @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
+    end
+
+    def anythingElse
+      if @tree.openElements[-1].name == 'head'
+        endTagHead('head')
+      else
+        @parser.phase = @parser.phases[:afterHead]
+      end
+    end
+
+    protected
+
+    def appendToHead(element)
+      if @tree.headPointer.nil?
+        assert @parser.innerHTML
+        @tree.openElements[-1].appendChild(element)
+      else
+        @tree.headPointer.appendChild(element)
+      end
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_row_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_row_phase.rb
new file mode 100644
index 00000000..b3ffa3f0
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_row_phase.rb
@@ -0,0 +1,87 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class InRowPhase < Phase
+
+    # http://www.whatwg.org/specs/web-apps/current-work/#in-row
+
+    handle_start 'html', %w( td th ) => 'TableCell', %w( caption col colgroup tbody tfoot thead tr ) => 'TableOther'
+
+    handle_end 'tr', 'table', %w( tbody tfoot thead ) => 'TableRowGroup', %w( body caption col colgroup html td th ) => 'Ignore'
+
+    def processCharacters(data)
+      @parser.phases[:inTable].processCharacters(data)
+    end
+
+    def startTagTableCell(name, attributes)
+      clearStackToTableRowContext
+      @tree.insertElement(name, attributes)
+      @parser.phase = @parser.phases[:inCell]
+      @tree.activeFormattingElements.push(Marker)
+    end
+
+    def startTagTableOther(name, attributes)
+      ignoreEndTag = ignoreEndTagTr
+      endTagTr('tr')
+      # XXX how are we sure it's always ignored in the innerHTML case?
+      @parser.phase.processStartTag(name, attributes) unless ignoreEndTag
+    end
+
+    def startTagOther(name, attributes)
+      @parser.phases[:inTable].processStartTag(name, attributes)
+    end
+
+    def endTagTr(name)
+      if ignoreEndTagTr
+        # innerHTML case
+        assert @parser.innerHTML
+        @parser.parseError
+      else
+        clearStackToTableRowContext
+        @tree.openElements.pop
+        @parser.phase = @parser.phases[:inTableBody]
+      end
+    end
+
+    def endTagTable(name)
+      ignoreEndTag = ignoreEndTagTr
+      endTagTr('tr')
+      # Reprocess the current tag if the tr end tag was not ignored
+      # XXX how are we sure it's always ignored in the innerHTML case?
+      @parser.phase.processEndTag(name) unless ignoreEndTag
+    end
+
+    def endTagTableRowGroup(name)
+      if in_scope?(name, true)
+        endTagTr('tr')
+        @parser.phase.processEndTag(name)
+      else
+        # innerHTML case
+        @parser.parseError
+      end
+    end
+
+    def endTagIgnore(name)
+      @parser.parseError(_("Unexpected end tag (#{name}) in the row phase. Ignored."))
+    end
+
+    def endTagOther(name)
+      @parser.phases[:inTable].processEndTag(name)
+    end
+
+    protected
+
+    # XXX unify this with other table helper methods
+    def clearStackToTableRowContext
+      until ['tr', 'html'].include?(name = @tree.openElements[-1].name)
+        @parser.parseError(_("Unexpected implied end tag (#{name}) in the row phase."))
+        @tree.openElements.pop
+      end
+    end
+
+    def ignoreEndTagTr
+      not in_scope?('tr', :tableVariant => true)
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_select_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_select_phase.rb
new file mode 100644
index 00000000..850b8f9f
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_select_phase.rb
@@ -0,0 +1,84 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class InSelectPhase < Phase
+
+    # http://www.whatwg.org/specs/web-apps/current-work/#in-select
+
+    handle_start 'html', 'option', 'optgroup', 'select'
+
+    handle_end 'option', 'optgroup', 'select', %w( caption table tbody tfoot thead tr td th ) => 'TableElements'
+
+    def processCharacters(data)
+      @tree.insertText(data)
+    end
+
+    def startTagOption(name, attributes)
+      # We need to imply </option> if <option> is the current node.
+      @tree.openElements.pop if @tree.openElements[-1].name == 'option'
+      @tree.insertElement(name, attributes)
+    end
+
+    def startTagOptgroup(name, attributes)
+      @tree.openElements.pop if @tree.openElements[-1].name == 'option'
+      @tree.openElements.pop if @tree.openElements[-1].name == 'optgroup'
+      @tree.insertElement(name, attributes)
+    end
+
+    def startTagSelect(name, attributes)
+      @parser.parseError(_('Unexpected start tag (select) in the select phase implies select start tag.'))
+      endTagSelect('select')
+    end
+
+    def startTagOther(name, attributes)
+      @parser.parseError(_('Unexpected start tag token (#{name}) in the select phase. Ignored.'))
+    end
+
+    def endTagOption(name)
+      if @tree.openElements[-1].name == 'option'
+        @tree.openElements.pop
+      else
+        @parser.parseError(_('Unexpected end tag (option) in the select phase. Ignored.'))
+      end
+    end
+
+    def endTagOptgroup(name)
+      # </optgroup> implicitly closes <option>
+      if @tree.openElements[-1].name == 'option' and @tree.openElements[-2].name == 'optgroup'
+        @tree.openElements.pop
+      end
+      # It also closes </optgroup>
+      if @tree.openElements[-1].name == 'optgroup'
+        @tree.openElements.pop
+      # But nothing else
+      else
+        @parser.parseError(_('Unexpected end tag (optgroup) in the select phase. Ignored.'))
+      end
+    end
+
+    def endTagSelect(name)
+      if in_scope?('select', true)
+        remove_open_elements_until('select')
+
+        @parser.resetInsertionMode
+      else
+        # innerHTML case
+        @parser.parseError
+      end
+    end
+
+    def endTagTableElements(name)
+      @parser.parseError(_("Unexpected table end tag (#{name}) in the select phase."))
+
+      if in_scope?(name, true)
+        endTagSelect('select')
+        @parser.phase.processEndTag(name)
+      end
+    end
+
+    def endTagOther(name)
+      @parser.parseError(_("Unexpected end tag token (#{name}) in the select phase. Ignored."))
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_table_body_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_table_body_phase.rb
new file mode 100644
index 00000000..79448216
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_table_body_phase.rb
@@ -0,0 +1,83 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class InTableBodyPhase < Phase
+
+    # http://www.whatwg.org/specs/web-apps/current-work/#in-table0
+
+    handle_start 'html', 'tr', %w( td th ) => 'TableCell', %w( caption col colgroup tbody tfoot thead ) => 'TableOther'
+
+    handle_end 'table', %w( tbody tfoot thead ) => 'TableRowGroup', %w( body caption col colgroup html td th tr ) => 'Ingore'
+
+    def processCharacters(data)
+      @parser.phases[:inTable].processCharacters(data)
+    end
+
+    def startTagTr(name, attributes)
+      clearStackToTableBodyContext
+      @tree.insertElement(name, attributes)
+      @parser.phase = @parser.phases[:inRow]
+    end
+
+    def startTagTableCell(name, attributes)
+      @parser.parseError(_("Unexpected table cell start tag (#{name}) in the table body phase."))
+      startTagTr('tr', {})
+      @parser.phase.processStartTag(name, attributes)
+    end
+
+    def startTagTableOther(name, attributes)
+      # XXX AT Any ideas on how to share this with endTagTable?
+      if in_scope?('tbody', true) or in_scope?('thead', true) or in_scope?('tfoot', true)
+        clearStackToTableBodyContext
+        endTagTableRowGroup(@tree.openElements[-1].name)
+        @parser.phase.processStartTag(name, attributes)
+      else
+        # innerHTML case
+        @parser.parseError
+      end
+    end
+
+    def startTagOther(name, attributes)
+      @parser.phases[:inTable].processStartTag(name, attributes)
+    end
+
+    def endTagTableRowGroup(name)
+      if in_scope?(name, true)
+        clearStackToTableBodyContext
+        @tree.openElements.pop
+        @parser.phase = @parser.phases[:inTable]
+      else
+        @parser.parseError(_("Unexpected end tag (#{name}) in the table body phase. Ignored."))
+      end
+    end
+
+    def endTagTable(name)
+      if in_scope?('tbody', true) or in_scope?('thead', true) or in_scope?('tfoot', true)
+        clearStackToTableBodyContext
+        endTagTableRowGroup(@tree.openElements[-1].name)
+        @parser.phase.processEndTag(name)
+      else
+        # innerHTML case
+        @parser.parseError
+      end
+    end
+
+    def endTagIgnore(name)
+      @parser.parseError(_("Unexpected end tag (#{name}) in the table body phase. Ignored."))
+    end
+
+    def endTagOther(name)
+      @parser.phases[:inTable].processEndTag(name)
+    end
+
+    protected
+
+    def clearStackToTableBodyContext
+      until ['tbody', 'tfoot', 'thead', 'html'].include?(name = @tree.openElements[-1].name)
+        @parser.parseError(_("Unexpected implied end tag (#{name}) in the table body phase."))
+        @tree.openElements.pop
+      end
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_table_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_table_phase.rb
new file mode 100644
index 00000000..c4b86039
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/in_table_phase.rb
@@ -0,0 +1,110 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class InTablePhase < Phase
+
+    # http://www.whatwg.org/specs/web-apps/current-work/#in-table
+
+    handle_start 'html', 'caption', 'colgroup', 'col', 'table'
+
+    handle_start %w( tbody tfoot thead ) => 'RowGroup', %w( td th tr ) => 'ImplyTbody'
+
+    handle_end 'table', %w( body caption col colgroup html tbody td tfoot th thead tr ) => 'Ignore'
+
+    def processCharacters(data)
+      @parser.parseError(_("Unexpected non-space characters in table context caused voodoo mode."))
+      # Make all the special element rearranging voodoo kick in
+      @tree.insertFromTable = true
+      # Process the character in the "in body" mode
+      @parser.phases[:inBody].processCharacters(data)
+      @tree.insertFromTable = false
+    end
+
+    def startTagCaption(name, attributes)
+      clearStackToTableContext
+      @tree.activeFormattingElements.push(Marker)
+      @tree.insertElement(name, attributes)
+      @parser.phase = @parser.phases[:inCaption]
+    end
+
+    def startTagColgroup(name, attributes)
+      clearStackToTableContext
+      @tree.insertElement(name, attributes)
+      @parser.phase = @parser.phases[:inColumnGroup]
+    end
+
+    def startTagCol(name, attributes)
+      startTagColgroup('colgroup', {})
+      @parser.phase.processStartTag(name, attributes)
+    end
+
+    def startTagRowGroup(name, attributes)
+      clearStackToTableContext
+      @tree.insertElement(name, attributes)
+      @parser.phase = @parser.phases[:inTableBody]
+    end
+
+    def startTagImplyTbody(name, attributes)
+      startTagRowGroup('tbody', {})
+      @parser.phase.processStartTag(name, attributes)
+    end
+
+    def startTagTable(name, attributes)
+      @parser.parseError(_("Unexpected start tag (table) in table phase. Implies end tag (table)."))
+      @parser.phase.processEndTag('table')
+      @parser.phase.processStartTag(name, attributes) unless @parser.innerHTML
+    end
+
+    def startTagOther(name, attributes)
+      @parser.parseError(_("Unexpected start tag (#{name}) in table context caused voodoo mode."))
+      # Make all the special element rearranging voodoo kick in
+      @tree.insertFromTable = true
+      # Process the start tag in the "in body" mode
+      @parser.phases[:inBody].processStartTag(name, attributes)
+      @tree.insertFromTable = false
+    end
+
+    def endTagTable(name)
+      if in_scope?('table', true)
+        @tree.generateImpliedEndTags
+      
+        unless @tree.openElements[-1].name == 'table'
+          @parser.parseError(_("Unexpected end tag (table). Expected end tag (#{@tree.openElements[-1].name})."))
+        end
+      
+        remove_open_elements_until('table')
+
+        @parser.resetInsertionMode
+      else
+        # innerHTML case
+        assert @parser.innerHTML
+        @parser.parseError
+      end
+    end
+
+    def endTagIgnore(name)
+      @parser.parseError(_("Unexpected end tag (#{name}). Ignored."))
+    end
+
+    def endTagOther(name)
+      @parser.parseError(_("Unexpected end tag (#{name}) in table context caused voodoo mode."))
+      # Make all the special element rearranging voodoo kick in
+      @parser.insertFromTable = true
+      # Process the end tag in the "in body" mode
+      @parser.phases[:inBody].processEndTag(name)
+      @parser.insertFromTable = false
+    end
+
+    protected
+
+    def clearStackToTableContext
+      # "clear the stack back to a table context"
+      until ['table', 'html'].include?(name = @tree.openElements[-1].name)
+        @parser.parseError(_("Unexpected implied end tag (#{name}) in the table phase."))
+        @tree.openElements.pop
+      end
+      # When the current node is <html> it's an innerHTML case
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/initial_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/initial_phase.rb
new file mode 100644
index 00000000..9914543b
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/initial_phase.rb
@@ -0,0 +1,49 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  class InitialPhase < Phase
+    # This phase deals with error handling as well which is currently not
+    # covered in the specification. The error handling is typically known as
+    # "quirks mode". It is expected that a future version of HTML5 will define this.
+
+    def processEOF
+      switchToRootElement(_('Unexpected End of file. Expected DOCTYPE.'))
+      @parser.phase.processEOF
+    end
+
+    def processComment(data)
+      @tree.insertComment(data, @tree.document)
+    end
+
+    def processDoctype(name, error)
+      @parser.parseError(_('Erroneous DOCTYPE.')) if error
+      @tree.insertDoctype(name)
+      @parser.phase = @parser.phases[:rootElement]
+    end
+
+    def processSpaceCharacters(data)
+      @tree.insertText(data, @tree.document)
+    end
+
+    def processCharacters(data)
+      switchToRootElement(_('Unexpected non-space characters. Expected DOCTYPE.'))
+      @parser.phase.processCharacters(data)
+    end
+
+    def processStartTag(name, attributes)
+      switchToRootElement(_("Unexpected start tag (#{name}). Expected DOCTYPE."))
+      @parser.phase.processStartTag(name, attributes)
+    end
+
+    def processEndTag(name)
+      switchToRootElement(_("Unexpected end tag (#{name}). Expected DOCTYPE."))
+      @parser.phase.processEndTag(name)
+    end
+
+    protected
+    def switchToRootElement(message) # report the error, then make :rootElement current
+      @parser.parseError(message)
+      @parser.phase = @parser.phases[:rootElement]
+    end
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/phase.rb
new file mode 100644
index 00000000..3a96b66f
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/phase.rb
@@ -0,0 +1,184 @@
+module HTML5lib
+  # Base class for helper objects that implement each phase of processing.
+  #
+  # Handler methods should be in the following order (they can be omitted):
+  #
+  #   * EOF
+  #   * Comment
+  #   * Doctype
+  #   * SpaceCharacters
+  #   * Characters
+  #   * StartTag
+  #     - startTag* methods
+  #   * EndTag
+  #     - endTag* methods
+  #
+  class Phase
+
+    # Builds a hash that maps tag names to handler method names.
+    #
+    # Each positional argument is a tag name or an array of tag names that
+    # share one handler, named +prefix+ plus the capitalized tag names. A
+    # trailing hash maps tag name(s) to an explicit handler name suffix.
+    #
+    # The following example call:
+    #
+    #   tag_handlers('startTag', 'html', %w( base link meta ), %w( li dt dd ) => 'ListItem')
+    #
+    # ...would return a hash equal to this:
+    #
+    #   { 'html' => 'startTagHtml',
+    #     'base' => 'startTagBaseLinkMeta',
+    #     'link' => 'startTagBaseLinkMeta',
+    #     'meta' => 'startTagBaseLinkMeta',
+    #     'li'   => 'startTagListItem',
+    #     'dt'   => 'startTagListItem',
+    #     'dd'   => 'startTagListItem'  }
+    #
+    def self.tag_handlers(prefix, *tags)
+      mapping = {}
+      if tags.last.is_a?(Hash)
+        tags.pop.each do |names, handler_method_suffix|
+          handler_method = prefix + handler_method_suffix
+          Array(names).each { |name| mapping[name] = handler_method }
+        end
+      end
+      tags.each do |names|
+        names = Array(names)
+        handler_method = prefix + names.map { |name| name.capitalize }.join
+        names.each { |name| mapping[name] = handler_method }
+      end
+      return mapping
+    end
+
+    # Start tag handler table of this class (created on first use). Tags
+    # without an entry fall back to 'startTagOther'.
+    def self.start_tag_handlers
+      @start_tag_handlers ||= Hash.new('startTagOther')
+    end
+
+    # Declare what start tags this Phase handles. Can be called more than once.
+    #
+    # Example usage:
+    #
+    #   handle_start 'html'
+    #   # html start tags will be handled by a method named 'startTagHtml'
+    #
+    #   handle_start %w( base link meta )
+    #   # base, link and meta start tags will be handled by a method named 'startTagBaseLinkMeta'
+    #
+    #   handle_start %w( li dt dd ) => 'ListItem'
+    #   # li, dt, and dd start tags will be handled by a method named 'startTagListItem'
+    #
+    def self.handle_start(*tags)
+      start_tag_handlers.update tag_handlers('startTag', *tags)
+    end
+
+    # End tag handler table of this class (created on first use). Tags
+    # without an entry fall back to 'endTagOther'.
+    def self.end_tag_handlers
+      @end_tag_handlers ||= Hash.new('endTagOther')
+    end
+
+    # Declare what end tags this Phase handles. Behaves like handle_start.
+    #
+    def self.handle_end(*tags)
+      end_tag_handlers.update tag_handlers('endTag', *tags)
+    end
+
+    # parser - object that receives parse errors and holds the current phase
+    # tree   - object used to inspect and modify the document being built
+    def initialize(parser, tree)
+      @parser, @tree = parser, tree
+    end
+
+    # Default end-of-file handling: generates implied end tags, then reports
+    # a parse error if unexpected elements are still open.
+    def processEOF
+      @tree.generateImpliedEndTags
+
+      if @tree.openElements.length > 2
+        @parser.parseError(_('Unexpected end of file. Missing closing tags.'))
+      elsif @tree.openElements.length == 2 and @tree.openElements[1].name != 'body'
+        # This happens for framesets or something?
+        @parser.parseError(_("Unexpected end of file. Expected end tag (#{@tree.openElements[1].name}) first."))
+      elsif @parser.innerHTML and @tree.openElements.length > 1 
+        # XXX This is not what the specification says. Not sure what to do here.
+        @parser.parseError(_('XXX innerHTML EOF'))
+      end
+      # Betting ends.
+    end
+
+    def processComment(data)
+      # For most phases the following is correct. Where it's not it will be
+      # overridden.
+      @tree.insertComment(data, @tree.openElements[-1])
+    end
+
+    # Default DOCTYPE handling: the DOCTYPE is only reported as a parse
+    # error; nothing is inserted.
+    def processDoctype(name, error)
+      @parser.parseError(_('Unexpected DOCTYPE. Ignored.'))
+    end
+
+    def processSpaceCharacters(data)
+      @tree.insertText(data)
+    end
+
+    # Dispatches to the handler registered for +name+ (see handle_start).
+    def processStartTag(name, attributes)
+      send self.class.start_tag_handlers[name], name, attributes
+    end
+
+    # Copies every attribute that the first open element does not already
+    # have onto that element, then clears the parser's firstStartTag flag.
+    def startTagHtml(name, attributes)
+      if @parser.firstStartTag == false and name == 'html'
+         @parser.parseError(_('html needs to be the first start tag.'))
+      end
+      # XXX Need a check here to see if the first start tag token emitted is
+      # this token... If it's not, invoke @parser.parseError.
+      attributes.each do |attr, value|
+        unless @tree.openElements[0].attributes.has_key?(attr)
+          @tree.openElements[0].attributes[attr] = value
+        end
+      end
+      @parser.firstStartTag = false
+    end
+
+    # Dispatches to the handler registered for +name+ (see handle_end).
+    def processEndTag(name)
+      send self.class.end_tag_handlers[name], name
+    end
+
+    # Wraps message strings; currently returns +string+ unchanged.
+    def _(string)
+      string
+    end
+
+    # Raises AssertionError unless +value+ is truthy. This uses raise rather
+    # than throw: throw performs a catch/throw jump and would not raise the
+    # exception object. AssertionError is not defined in this file.
+    def assert(value)
+      raise AssertionError.new unless value
+    end
+
+    # Shorthand for @tree.elementInScope.
+    def in_scope?(*args)
+      @tree.elementInScope(*args)
+    end
+
+    # Pops open elements until one named +name+ has been popped or, when no
+    # name is given, until the block returns a truthy value for the popped
+    # element. Returns the last element popped.
+    def remove_open_elements_until(name=nil)
+      finished = false
+      until finished
+        element = @tree.openElements.pop
+        finished = name.nil?? yield(element) : element.name == name
+      end
+      return element
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/root_element_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/root_element_phase.rb
new file mode 100644
index 00000000..7a4b67c8
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/root_element_phase.rb
@@ -0,0 +1,58 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  # Phase that creates the root html element.
+  #
+  # Comments and whitespace are inserted with the document as the target
+  # node. EOF, characters and tags first create the html element (which
+  # also selects the :beforeHead phase) and are then passed to that phase.
+  class RootElementPhase < Phase
+
+    def processEOF
+      phase_after_root.processEOF
+    end
+
+    def processComment(data)
+      @tree.insertComment(data, @tree.document)
+    end
+
+    def processSpaceCharacters(data)
+      @tree.insertText(data, @tree.document)
+    end
+
+    def processCharacters(data)
+      phase_after_root.processCharacters(data)
+    end
+
+    # An html start tag seen here sets the parser's firstStartTag flag before
+    # the token is passed on.
+    def processStartTag(name, attributes)
+      if name == 'html'
+        @parser.firstStartTag = true
+      end
+      phase_after_root.processStartTag(name, attributes)
+    end
+
+    def processEndTag(name)
+      phase_after_root.processEndTag(name)
+    end
+
+    # Creates an html element without attributes, pushes it onto the open
+    # elements, appends it to the document and selects the :beforeHead phase.
+    def insertHtmlElement
+      html = @tree.createElement('html', {})
+      @tree.openElements.push(html)
+      @tree.document.appendChild(html)
+      @parser.phase = @parser.phases[:beforeHead]
+    end
+
+    private
+
+    # Inserts the html element and returns the phase that is current afterwards.
+    def phase_after_root
+      insertHtmlElement
+      @parser.phase
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/html5parser/trailing_end_phase.rb b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/trailing_end_phase.rb
new file mode 100644
index 00000000..f8f8d33a
--- /dev/null
+++ b/vendor/plugins/HTML5lib/lib/html5lib/html5parser/trailing_end_phase.rb
@@ -0,0 +1,43 @@
+require 'html5lib/html5parser/phase'
+
+module HTML5lib
+  # Phase in which only end of file is expected. Non-space characters and
+  # tags are reported as parse errors; the parser then switches back to its
+  # last phase, which processes the token.
+  class TrailingEndPhase < Phase
+
+    # Nothing is done at end of file.
+    def processEOF
+    end
+
+    def processComment(data)
+      @tree.insertComment(data, @tree.document)
+    end
+
+    # Whitespace is passed to the last phase without switching phases.
+    def processSpaceCharacters(data)
+      @parser.lastPhase.processSpaceCharacters(data)
+    end
+
+    def processCharacters(data)
+      @parser.parseError(_('Unexpected non-space characters. Expected end of file.'))
+      @parser.phase = @parser.lastPhase
+      @parser.phase.processCharacters(data)
+    end
+
+    def processStartTag(name, attributes)
+      # Double quotes are required for #{name} to be interpolated.
+      @parser.parseError(_("Unexpected start tag (#{name}). Expected end of file."))
+      @parser.phase = @parser.lastPhase
+      @parser.phase.processStartTag(name, attributes)
+    end
+
+    def processEndTag(name)
+      # Double quotes are required for #{name} to be interpolated.
+      @parser.parseError(_("Unexpected end tag (#{name}). Expected end of file."))
+      @parser.phase = @parser.lastPhase
+      @parser.phase.processEndTag(name)
+    end
+
+  end
+end
\ No newline at end of file
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/inputstream.rb b/vendor/plugins/HTML5lib/lib/html5lib/inputstream.rb
index 7a7349c8..62cc9948 100755
--- a/vendor/plugins/HTML5lib/lib/html5lib/inputstream.rb
+++ b/vendor/plugins/HTML5lib/lib/html5lib/inputstream.rb
@@ -3,14 +3,14 @@ require 'html5lib/constants'
 
 module HTML5lib
 
-# Provides a unicode stream of characters to the HTMLTokenizer.
+  # Provides a unicode stream of characters to the HTMLTokenizer.
 
-# This class takes care of character encoding and removing or replacing
-# incorrect byte-sequences and also provides column and line tracking.
+  # This class takes care of character encoding and removing or replacing
+  # incorrect byte-sequences and also provides column and line tracking.
 
-class HTMLInputStream
+  class HTMLInputStream
 
-    attr_accessor :queue, :charEncoding
+    attr_accessor :queue, :char_encoding
 
     # Initialises the HTMLInputStream.
     # 
@@ -27,523 +27,524 @@ class HTMLInputStream
     # parseMeta - Look for a <meta> element containing encoding information
 
     def initialize(source, options = {})
-        @encoding = nil
-        @parseMeta = true
-        @chardet = true
+      @encoding = nil
+      @parse_meta = true
+      @chardet = true
 
-        options.each { |name, value| instance_variable_set("@#{name}", value) }
+      options.each { |name, value| instance_variable_set("@#{name}", value) }
 
-        # List of where new lines occur
-        @newLines = []
+      # List of where new lines occur
+      @new_lines = []
 
-        # Raw Stream
-        @rawStream = openStream(source)
+      # Raw Stream
+      @raw_stream = open_stream(source)
 
-        # Encoding Information
-        #Number of bytes to use when looking for a meta element with
-        #encoding information
-        @NUM_BYTES_META = 512
-        #Encoding to use if no other information can be found
-        @DEFAULT_ENCODING = 'windows-1252'
-        
-        #Detect encoding iff no explicit "transport level" encoding is supplied
-        if @encoding.nil? or not HTML5lib.isValidEncoding(@encoding)
-            @charEncoding = detectEncoding
-        else
-            @charEncoding = @encoding
+      # Encoding Information
+      #Number of bytes to use when looking for a meta element with
+      #encoding information
+      @NUM_BYTES_META = 512
+      #Encoding to use if no other information can be found
+      @DEFAULT_ENCODING = 'windows-1252'
+    
+      #Detect encoding iff no explicit "transport level" encoding is supplied
+      if @encoding.nil? or not HTML5lib.is_valid_encoding(@encoding)
+        @char_encoding = detect_encoding
+      else
+        @char_encoding = @encoding
+      end
+
+      # Read bytes from stream, decoding them into Unicode from @char_encoding
+      uString = @raw_stream.read
+      unless @char_encoding == 'utf-8'
+        begin
+          require 'iconv'
+          uString = Iconv.iconv('utf-8', @char_encoding, uString)[0]
+        rescue
         end
+      end
 
-        # Read bytes from stream decoding them into Unicode
-        uString = @rawStream.read
-        unless @charEncoding == 'utf-8'
-            begin
-                require 'iconv'
-                uString = Iconv.iconv('utf-8', @encoding, uString)[0]
-            rescue
-            end
-        end
+      # Normalize newlines and null characters
+      uString.gsub!(/\r\n?/, "\n")
+      uString.gsub!("\x00", [0xFFFD].pack('U'))
 
-        # Normalize newlines and null characters
-        uString.gsub!(/\r\n?/, "\n")
-        uString.gsub!("\x00", [0xFFFD].pack('U'))
+      # Convert the unicode string into a list to be used as the data stream
+      @data_stream = uString
 
-        # Convert the unicode string into a list to be used as the data stream
-        @dataStream = uString
+      @queue = []
 
-        @queue = []
-
-        # Reset position in the list to read from
-        reset
+      # Reset position in the list to read from
+      reset
     end
 
     # Produces a file object from source.
     #
     # source can be either a file object, local filename or a string.
-    def openStream(source)
-        # Already an IO like object
-        if source.respond_to?(:read)
-            @stream = source
-        else
-            # Treat source as a string and wrap in StringIO
-            @stream = StringIO.new(source)
-        end
-        return @stream
+    def open_stream(source)
+      # Already an IO like object
+      if source.respond_to?(:read)
+        @stream = source
+      else
+        # Treat source as a string and wrap in StringIO
+        @stream = StringIO.new(source)
+      end
+      return @stream
     end
 
-    def detectEncoding
+    def detect_encoding
 
-        #First look for a BOM
-        #This will also read past the BOM if present
-        encoding = detectBOM
-        #If there is no BOM need to look for meta elements with encoding 
-        #information
-        if encoding.nil? and @parseMeta
-            encoding = detectEncodingMeta
+      #First look for a BOM
+      #This will also read past the BOM if present
+      encoding = detect_bom
+      #If there is no BOM need to look for meta elements with encoding 
+      #information
+      if encoding.nil? and @parse_meta
+        encoding = detect_encoding_meta
+      end
+      #Guess with chardet, if avaliable
+      if encoding.nil? and @chardet
+        begin
+          require 'rubygems'
+          require 'UniversalDetector' # gem install chardet
+          buffer = @raw_stream.read
+          encoding = UniversalDetector::chardet(buffer)['encoding']
+          @raw_stream = open_stream(buffer)
+        rescue LoadError
         end
-        #Guess with chardet, if avaliable
-        if encoding.nil? and @chardet
-            begin
-                require 'rubygems'
-                require 'UniversalDetector' # gem install chardet
-                buffer = @rawStream.read
-                encoding = UniversalDetector::chardet(buffer)['encoding']
-                @rawStream = openStream(buffer)
-            rescue LoadError
-            end
-        end
-        # If all else fails use the default encoding
-        if encoding.nil?
-            encoding = @DEFAULT_ENCODING
-        end
-        
-        #Substitute for equivalent encodings:
-        encodingSub = {'ascii' => 'windows-1252', 'iso-8859-1' => 'windows-1252'}
+      end
+      # If all else fails use the default encoding
+      if encoding.nil?
+        encoding = @DEFAULT_ENCODING
+      end
+    
+      #Substitute for equivalent encodings:
+      encoding_sub = {'ascii' => 'windows-1252', 'iso-8859-1' => 'windows-1252'}
 
-        if encodingSub.has_key?(encoding.downcase)
-            encoding = encodingSub[encoding.downcase]
-        end
+      if encoding_sub.has_key?(encoding.downcase)
+        encoding = encoding_sub[encoding.downcase]
+      end
 
-        return encoding
+      return encoding
     end
 
     # Attempts to detect at BOM at the start of the stream. If
     # an encoding can be determined from the BOM return the name of the
     # encoding otherwise return nil
-    def detectBOM
-        bomDict = {
-            "\xef\xbb\xbf" => 'utf-8',
-            "\xff\xfe" => 'utf-16-le',
-            "\xfe\xff" => 'utf-16-be',
-            "\xff\xfe\x00\x00" => 'utf-32-le',
-            "\x00\x00\xfe\xff" => 'utf-32-be'
-        }
+    def detect_bom
+      bom_dict = {
+        "\xef\xbb\xbf" => 'utf-8',
+        "\xff\xfe" => 'utf-16-le',
+        "\xfe\xff" => 'utf-16-be',
+        "\xff\xfe\x00\x00" => 'utf-32-le',
+        "\x00\x00\xfe\xff" => 'utf-32-be'
+      }
 
-        # Go to beginning of file and read in 4 bytes
-        @rawStream.seek(0)
-        string = @rawStream.read(4)
-        return nil unless string
+      # Go to beginning of file and read in 4 bytes
+      @raw_stream.seek(0)
+      string = @raw_stream.read(4)
+      return nil unless string
 
-        # Try detecting the BOM using bytes from the string
-        encoding = bomDict[string[0...3]]          # UTF-8
-        seek = 3
+      # Try detecting the BOM using bytes from the string
+      encoding = bom_dict[string[0...3]]      # UTF-8
+      seek = 3
+      unless encoding
+        # Need to detect UTF-32 before UTF-16
+        encoding = bom_dict[string]       # UTF-32
+        seek = 4
         unless encoding
-            # Need to detect UTF-32 before UTF-16
-            encoding = bomDict[string]             # UTF-32
-            seek = 4
-            unless encoding
-                encoding = bomDict[string[0...2]]  # UTF-16
-                seek = 2
-            end
+          encoding = bom_dict[string[0...2]]  # UTF-16
+          seek = 2
         end
+      end
 
-        #AT - move this to the caller?
-        # Set the read position past the BOM if one was found, otherwise
-        # set it to the start of the stream
-        @rawStream.seek(encoding ? seek : 0)
+      #AT - move this to the caller?
+      # Set the read position past the BOM if one was found, otherwise
+      # set it to the start of the stream
+      @raw_stream.seek(encoding ? seek : 0)
 
-        return encoding
+      return encoding
     end
 
     # Report the encoding declared by the meta element
-    def detectEncodingMeta
-        parser = EncodingParser.new(@rawStream.read(@NUM_BYTES_META))
-        @rawStream.seek(0)
-        return parser.getEncoding
+    def detect_encoding_meta
+      parser = EncodingParser.new(@raw_stream.read(@NUM_BYTES_META))
+      @raw_stream.seek(0)
+      return parser.get_encoding
     end
 
-    def determineNewLines
-        # Looks through the stream to find where new lines occur so
-        # the position method can tell where it is.
-        @newLines.push(0)
-        (0...@dataStream.length).each { |i| @newLines.push(i) if @dataStream[i] == ?\n }
+    def determine_new_lines
+      # Looks through the stream to find where new lines occur so
+      # the position method can tell where it is.
+      @new_lines.push(0)
+      (0...@data_stream.length).each { |i| @new_lines.push(i) if @data_stream[i] == ?\n }
     end
 
     # Returns (line, col) of the current position in the stream.
     def position
-        # Generate list of new lines first time around
-        determineNewLines if @newLines.empty?
-        line = 0
-        tell = @tell
-        @newLines.each do |pos|
-            break unless pos < tell
-            line += 1
-        end
-        col = tell - @newLines[line-1] - 1
-        return [line, col]
+      # Generate list of new lines first time around
+      determine_new_lines if @new_lines.empty?
+      line = 0
+      tell = @tell
+      @new_lines.each do |pos|
+        break unless pos < tell
+        line += 1
+      end
+      col = tell - @new_lines[line-1] - 1
+      return [line, col]
     end
 
     # Resets the position in the stream back to the start.
     def reset
-        @tell = 0
+      @tell = 0
     end
 
     # Read one character from the stream or queue if available. Return
     # EOF when EOF is reached.
     def char
-        unless @queue.empty?
-            return @queue.shift
-        else
-            begin
-                @tell += 1
-                return @dataStream[@tell - 1].chr
-            rescue
-                return :EOF
-            end
+      unless @queue.empty?
+        return @queue.shift
+      else
+        begin
+          @tell += 1
+          return @data_stream[@tell - 1].chr
+        rescue
+          return :EOF
         end
+      end
     end
 
     # Returns a string of characters from the stream up to but not
     # including any character in characters or EOF. characters can be
     # any container that supports the in method being called on it.
-    def charsUntil(characters, opposite = false)
-        charStack = [char]
+    def chars_until(characters, opposite=false)
+      char_stack = [char]
 
-        unless charStack[0] == :EOF
-            while (characters.include? charStack[-1]) == opposite
-                unless @queue.empty?
-                    # First from the queue
-                    charStack.push(@queue.shift)
-                    break if charStack[-1] == :EOF
-                else
-                    # Then the rest
-                    begin
-                        charStack.push(@dataStream[@tell].chr)
-                        @tell += 1
-                    rescue
-                        charStack.push(:EOF)
-                        break
-                    end
-                end
+      unless char_stack[0] == :EOF
+        while (characters.include? char_stack[-1]) == opposite
+          unless @queue.empty?
+            # First from the queue
+            char_stack.push(@queue.shift)
+            break if char_stack[-1] == :EOF
+          else
+            # Then the rest
+            begin
+              char_stack.push(@data_stream[@tell].chr)
+              @tell += 1
+            rescue
+              char_stack.push(:EOF)
+              break
             end
+          end
         end
+      end
 
-        # Put the character stopped on back to the front of the queue
-        # from where it came.
-        @queue.insert(0, charStack.pop)
-        return charStack.join('')
+      # Put the character stopped on back to the front of the queue
+      # from where it came.
+      @queue.insert(0, char_stack.pop)
+      return char_stack.join('')
     end
-end
+  end
 
-# String-like object with an assosiated position and various extra methods
-# If the position is ever greater than the string length then an exception is raised
-class EncodingBytes < String
+  # String-like object with an assosiated position and various extra methods
+  # If the position is ever greater than the string length then an exception is raised
+  class EncodingBytes < String
 
     attr_accessor :position
 
     def initialize(value)
-        super(value)
-        @position = -1
+      super(value)
+      @position = -1
     end
-    
+  
     def each
-        while @position < length
-            @position += 1
-            yield self[@position]
-        end
+      while @position < length
+        @position += 1
+        yield self[@position]
+      end
     rescue EOF
     end
-    
-    def currentByte
-        raise EOF if @position >= length
-        return self[@position].chr
+  
+    def current_byte
+      raise EOF if @position >= length
+      return self[@position].chr
     end
-    
+  
     # Skip past a list of characters
-    def skip(chars = SPACE_CHARACTERS)
-        while chars.include?(currentByte)
-            @position += 1
-        end
+    def skip(chars=SPACE_CHARACTERS)
+      while chars.include?(current_byte)
+        @position += 1
+      end
     end
 
     # Look for a sequence of bytes at the start of a string. If the bytes 
     # are found return true and advance the position to the byte after the 
     # match. Otherwise return false and leave the position alone
-    def matchBytes(bytes, lower = false)
-        data = self[position ... position+bytes.length]
-        data.downcase! if lower
-        rv = (data == bytes)
-        @position += bytes.length if rv == true
-        return rv
+    def match_bytes(bytes, lower=false)
+      data = self[position ... position+bytes.length]
+      data.downcase! if lower
+      rv = (data == bytes)
+      @position += bytes.length if rv == true
+      return rv
     end
-    
+  
     # Look for the next sequence of bytes matching a given sequence. If
     # a match is found advance the position to the last byte of the match
-    def jumpTo(bytes)
-        newPosition = self[position .. -1].index(bytes)
-        if newPosition
-            @position += (newPosition + bytes.length-1)
-            return true
-        else
-            raise EOF
-        end
+    def jump_to(bytes)
+      new_position = self[position .. -1].index(bytes)
+      if new_position
+        @position += (new_position + bytes.length-1)
+        return true
+      else
+        raise EOF
+      end
     end
-    
+  
     # Move the pointer so it points to the next byte in a set of possible
     # bytes
-    def findNext(byteList)
-        until byteList.include?(currentByte)
-            @position += 1
-        end
+    def find_next(byte_list)
+      until byte_list.include?(current_byte)
+        @position += 1
+      end
     end
-end
+  end
 
-# Mini parser for detecting character encoding from meta elements
-class EncodingParser
+  # Mini parser for detecting character encoding from meta elements
+  class EncodingParser
 
     # string - the data to work on for encoding detection
     def initialize(data)
-        @data = EncodingBytes.new(data.to_s)
-        @encoding = nil
+      @data = EncodingBytes.new(data.to_s)
+      @encoding = nil
     end
 
     @@method_dispatch = [
-        ['<!--', :handleComment],
-        ['<meta', :handleMeta],
-        ['</', :handlePossibleEndTag],
-        ['<!', :handleOther],
-        ['<?', :handleOther],
-        ['<', :handlePossibleStartTag]
+      ['<!--', :handle_comment],
+      ['<meta', :handle_meta],
+      ['</', :handle_possible_end_tag],
+      ['<!', :handle_other],
+      ['<?', :handle_other],
+      ['<', :handle_possible_start_tag]
     ]
 
-    def getEncoding
-        @data.each do |byte|
-            keepParsing = true
-            @@method_dispatch.each do |(key, method)|
-                if @data.matchBytes(key, lower = true)
-                    keepParsing = send(method)    
-                    break
-                end
-            end
-            break unless keepParsing
+    def get_encoding
+      @data.each do |byte|
+        keep_parsing = true
+        @@method_dispatch.each do |(key, method)|
+          if @data.match_bytes(key, lower = true)
+            keep_parsing = send(method)
+            break
+          end
         end
-        @encoding = @encoding.strip unless @encoding.nil?
-        return @encoding
+        break unless keep_parsing
+      end
+      @encoding = @encoding.strip unless @encoding.nil?
+      return @encoding
     end
 
     # Skip over comments
-    def handleComment
-        return @data.jumpTo('-->')
+    def handle_comment
+      return @data.jump_to('-->')
     end
 
-    def handleMeta
-        # if we have <meta not followed by a space so just keep going
-        return true unless SPACE_CHARACTERS.include?(@data.currentByte)
+    def handle_meta
+      # if we have <meta not followed by a space so just keep going
+      return true unless SPACE_CHARACTERS.include?(@data.current_byte)
 
-        #We have a valid meta element we want to search for attributes
-        while true
-            #Try to find the next attribute after the current position
-            attr = getAttribute
+      #We have a valid meta element we want to search for attributes
+      while true
+        #Try to find the next attribute after the current position
+        attr = get_attribute
 
-            return true if attr.nil?
-                
-            if attr[0] == 'charset'
-                tentativeEncoding = attr[1]
-                if HTML5lib.isValidEncoding(tentativeEncoding)
-                    @encoding = tentativeEncoding    
-                    return false
-                end
-            elsif attr[0] == 'content'
-                contentParser = ContentAttrParser.new(EncodingBytes.new(attr[1]))
-                tentativeEncoding = contentParser.parse
-                if HTML5lib.isValidEncoding(tentativeEncoding)
-                    @encoding = tentativeEncoding    
-                    return false
-                end
-            end
-        end
-    end
-
-    def handlePossibleStartTag
-        return handlePossibleTag(false)
-    end
-
-    def handlePossibleEndTag
-        @data.position+=1
-        return handlePossibleTag(true)
-    end
-
-    def handlePossibleTag(endTag)
-        unless ASCII_LETTERS.include?(@data.currentByte)
-            #If the next byte is not an ascii letter either ignore this
-            #fragment (possible start tag case) or treat it according to 
-            #handleOther
-            if endTag
-                @data.position -= 1
-                handleOther
-            end
-            return true
-        end
+        return true if attr.nil?
         
-        @data.findNext(SPACE_CHARACTERS + ['<', '>'])
+        if attr[0] == 'charset'
+          tentative_encoding = attr[1]
+          if HTML5lib.is_valid_encoding(tentative_encoding)
+            @encoding = tentative_encoding  
+            return false
+          end
+        elsif attr[0] == 'content'
+          content_parser = ContentAttrParser.new(EncodingBytes.new(attr[1]))
+          tentative_encoding = content_parser.parse
+          if HTML5lib.is_valid_encoding(tentative_encoding)
+            @encoding = tentative_encoding
+            return false
+          end
+        end
+      end
+    end
 
-        if @data.currentByte == '<'
-            #return to the first step in the overall "two step" algorithm
-            #reprocessing the < byte
-            @data.position -= 1    
-        else
-            #Read all attributes
-            {} until getAttribute.nil?
+    def handle_possible_start_tag
+      return handle_possible_tag(false)
+    end
+
+    def handle_possible_end_tag
+      @data.position += 1
+      return handle_possible_tag(true)
+    end
+
+    def handle_possible_tag(end_tag)
+      unless ASCII_LETTERS.include?(@data.current_byte)
+        #If the next byte is not an ascii letter either ignore this
+        #fragment (possible start tag case) or treat it according to 
+        #handleOther
+        if end_tag
+          @data.position -= 1
+          handle_other
         end
         return true
+      end
+    
+      @data.find_next(SPACE_CHARACTERS + ['<', '>'])
+
+      if @data.current_byte == '<'
+        #return to the first step in the overall "two step" algorithm
+        #reprocessing the < byte
+        @data.position -= 1  
+      else
+        #Read all attributes
+        {} until get_attribute.nil?
+      end
+      return true
     end
 
-    def handleOther
-        return @data.jumpTo('>')
+    def handle_other
+      return @data.jump_to('>')
     end
 
-    # Return a name,value pair for the next attribute in the stream, 
+    # Return a name,value pair for the next attribute in the stream,
     # if one is found, or nil
-    def getAttribute
-        @data.skip(SPACE_CHARACTERS + ['/'])
+    def get_attribute
+      @data.skip(SPACE_CHARACTERS + ['/'])
 
-        if @data.currentByte == '<'
-            @data.position -= 1
-            return nil
-        elsif @data.currentByte == '>'
-            return nil
-        end
+      if @data.current_byte == '<'
+        @data.position -= 1
+        return nil
+      elsif @data.current_byte == '>'
+        return nil
+      end
 
-        attrName = []
-        attrValue = []
-        spaceFound = false
-        #Step 5 attribute name
-        while true
-            if @data.currentByte == '=' and attrName:   
-                break
-            elsif SPACE_CHARACTERS.include?(@data.currentByte)
-                spaceFound = true
-                break
-            elsif ['/', '<', '>'].include?(@data.currentByte)
-                return [attrName.join(''), '']
-            elsif ASCII_UPPERCASE.include?(@data.currentByte)
-                attrName.push(@data.currentByte.downcase)
-            else
-                attrName.push(@data.currentByte)
-            end
-            #Step 6
-            @data.position += 1
-        end
-        #Step 7
-        if spaceFound
-            @data.skip
-            #Step 8
-            unless @data.currentByte == '='
-                @data.position -= 1
-                return [attrName.join(''), '']
-            end
-        end
-        #XXX need to advance position in both spaces and value case
-        #Step 9
-        @data.position += 1
-        #Step 10
-        @data.skip
-        #Step 11
-        if ["'", '"'].include?(@data.currentByte)
-            #11.1
-            quoteChar = @data.currentByte
-            while true
-                @data.position+=1
-                #11.3
-                if @data.currentByte == quoteChar
-                    @data.position += 1
-                    return [attrName.join(''), attrValue.join('')]
-                #11.4
-                elsif ASCII_UPPERCASE.include?(@data.currentByte)
-                    attrValue.push(@data.currentByte.downcase)
-                #11.5
-                else
-                    attrValue.push(@data.currentByte)
-                end
-            end
-        elsif ['>', '<'].include?(@data.currentByte)
-            return [attrName.join(''), '']
-        elsif ASCII_UPPERCASE.include?(@data.currentByte)
-            attrValue.push(@data.currentByte.downcase)
+      attr_name = []
+      attr_value = []
+      space_found = false
+      #Step 5 attribute name
+      while true
+        if @data.current_byte == '=' and attr_name:
+          break
+        elsif SPACE_CHARACTERS.include?(@data.current_byte)
+          space_found = true
+          break
+        elsif ['/', '<', '>'].include?(@data.current_byte)
+          return [attr_name.join(''), '']
+        elsif ASCII_UPPERCASE.include?(@data.current_byte)
+          attr_name.push(@data.current_byte.downcase)
         else
-            attrValue.push(@data.currentByte)
+          attr_name.push(@data.current_byte)
         end
+        #Step 6
+        @data.position += 1
+      end
+      #Step 7
+      if space_found
+        @data.skip
+        #Step 8
+        unless @data.current_byte == '='
+          @data.position -= 1
+          return [attr_name.join(''), '']
+        end
+      end
+      #XXX need to advance position in both spaces and value case
+      #Step 9
+      @data.position += 1
+      #Step 10
+      @data.skip
+      #Step 11
+      if ["'", '"'].include?(@data.current_byte)
+        #11.1
+        quote_char = @data.current_byte
         while true
-            @data.position +=1
-            if (SPACE_CHARACTERS + ['>', '<']).include?(@data.currentByte)
-                return [attrName.join(''), attrValue.join('')]
-            elsif ASCII_UPPERCASE.include?(@data.currentByte)
-                attrValue.push(@data.currentByte.downcase)
-            else
-                attrValue.push(@data.currentByte)
-            end
+          @data.position+=1
+          #11.3
+          if @data.current_byte == quote_char
+            @data.position += 1
+            return [attr_name.join(''), attr_value.join('')]
+          #11.4
+          elsif ASCII_UPPERCASE.include?(@data.current_byte)
+            attr_value.push(@data.current_byte.downcase)
+          #11.5
+          else
+            attr_value.push(@data.current_byte)
+          end
         end
+      elsif ['>', '<'].include?(@data.current_byte)
+        return [attr_name.join(''), '']
+      elsif ASCII_UPPERCASE.include?(@data.current_byte)
+        attr_value.push(@data.current_byte.downcase)
+      else
+        attr_value.push(@data.current_byte)
+      end
+      while true
+        @data.position += 1
+        if (SPACE_CHARACTERS + ['>', '<']).include?(@data.current_byte)
+          return [attr_name.join(''), attr_value.join('')]
+        elsif ASCII_UPPERCASE.include?(@data.current_byte)
+          attr_value.push(@data.current_byte.downcase)
+        else
+          attr_value.push(@data.current_byte)
+        end
+      end
     end
-end
+  end
 
-class ContentAttrParser
+  class ContentAttrParser
     def initialize(data)
-        @data = data
+      @data = data
     end
+
     def parse
-        begin
-            #Skip to the first ";"
-            @data.position = 0
-            @data.jumpTo(';')
-            @data.position += 1
-            @data.skip
-            #Check if the attr name is charset 
-            #otherwise return
-            @data.jumpTo('charset')
-            @data.position += 1
-            @data.skip
-            unless @data.currentByte == '='
-                #If there is no = sign keep looking for attrs
-                return nil
-            end
-            @data.position += 1
-            @data.skip
-            #Look for an encoding between matching quote marks
-            if ['"', "'"].include?(@data.currentByte)
-                quoteMark = @data.currentByte
-                @data.position += 1
-                oldPosition = @data.position
-                @data.jumpTo(quoteMark)
-                return @data[oldPosition ... @data.position]
-            else
-                #Unquoted value
-                oldPosition = @data.position
-                begin
-                    @data.findNext(SPACE_CHARACTERS)
-                    return @data[oldPosition ... @data.position]
-                rescue EOF
-                    #Return the whole remaining value
-                    return @data[oldPosition .. -1]
-                end
-            end
-        rescue EOF
-            return nil
+      begin
+        #Skip to the first ";"
+        @data.position = 0
+        @data.jump_to(';')
+        @data.position += 1
+        @data.skip
+        #Check if the attr name is charset 
+        #otherwise return
+        @data.jump_to('charset')
+        @data.position += 1
+        @data.skip
+        unless @data.current_byte == '='
+          #If there is no = sign keep looking for attrs
+          return nil
         end
+        @data.position += 1
+        @data.skip
+        #Look for an encoding between matching quote marks
+        if ['"', "'"].include?(@data.current_byte)
+          quote_mark = @data.current_byte
+          @data.position += 1
+          old_position = @data.position
+          @data.jump_to(quote_mark)
+          return @data[old_position ... @data.position]
+        else
+          #Unquoted value
+          old_position = @data.position
+          begin
+            @data.find_next(SPACE_CHARACTERS)
+            return @data[old_position ... @data.position]
+          rescue EOF
+            #Return the whole remaining value
+            return @data[old_position .. -1]
+          end
+        end
+      rescue EOF
+        return nil
+      end
     end
-end
+  end
 
-# Determine if a string is a supported encoding
-def self.isValidEncoding(encoding)
+  # Determine if a string is a supported encoding
+  def self.is_valid_encoding(encoding)
     (not encoding.nil? and encoding.kind_of?(String) and ENCODINGS.include?(encoding.downcase.strip))
-end
+  end
 
 end
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/liberalxmlparser.rb b/vendor/plugins/HTML5lib/lib/html5lib/liberalxmlparser.rb
index 566ecadc..5410b98e 100755
--- a/vendor/plugins/HTML5lib/lib/html5lib/liberalxmlparser.rb
+++ b/vendor/plugins/HTML5lib/lib/html5lib/liberalxmlparser.rb
@@ -16,126 +16,126 @@ require 'html5lib/constants'
 
 module HTML5lib
 
-# liberal XML parser
-class XMLParser < HTMLParser
+  # liberal XML parser
+  class XMLParser < HTMLParser
 
-    def initialize(options={})
-        super options
-        @phases[:initial] = XmlRootPhase.new(self, @tree)
+    def initialize(options = {})
+      super options
+      @phases[:initial] = XmlRootPhase.new(self, @tree)
     end
 
     def normalizeToken(token)
-        if token[:type] == :StartTag or token[:type] == :EmptyTag
-            # We need to remove the duplicate attributes and convert attributes
-            # to a dict so that [["x", "y"], ["x", "z"]] becomes {"x": "y"}
+      if token[:type] == :StartTag or token[:type] == :EmptyTag
+        # We need to remove the duplicate attributes and convert attributes
+        # to a hash so that [["x", "y"], ["x", "z"]] becomes {"x" => "y"}
 
-            token[:data] = Hash[*token[:data].reverse.flatten]
+        token[:data] = Hash[*token[:data].reverse.flatten]
 
-            # For EmptyTags, process both a Start and an End tag
-            if token[:type] == :EmptyTag
-                @phase.processStartTag(token[:name], token[:data])
-                token[:data] = {}
-                token[:type] = :EndTag
-            end
-
-        elsif token[:type] == :EndTag
-            if token[:data]
-               parseError(_("End tag contains unexpected attributes."))
-            end
-
-        elsif token[:type] == :Comment
-            # Rescue CDATA from the comments
-            if token[:data][0..6] == "[CDATA[" and token[:data][-2..-1] == "]]"
-                token[:type] = :Characters
-                token[:data] = token[:data][7 ... -2]
-            end
+        # For EmptyTags, process both a Start and an End tag
+        if token[:type] == :EmptyTag
+          @phase.processStartTag(token[:name], token[:data])
+          token[:data] = {}
+          token[:type] = :EndTag
         end
 
-        return token
+      elsif token[:type] == :EndTag
+        if token[:data]
+           parseError(_("End tag contains unexpected attributes."))
+        end
+
+      elsif token[:type] == :Comment
+        # Rescue CDATA from the comments
+        if token[:data][0..6] == "[CDATA[" and token[:data][-2..-1] == "]]"
+          token[:type] = :Characters
+          token[:data] = token[:data][7 ... -2]
+        end
+      end
+
+      return token
     end
-end
+  end
 
-# liberal XMTHML parser
-class XHTMLParser < XMLParser
+  # liberal XHTML parser
+  class XHTMLParser < XMLParser
 
-    def initialize(options={})
-        super options
-        @phases[:initial] = InitialPhase.new(self, @tree)
-        @phases[:rootElement] = XhmlRootPhase.new(self, @tree)
+    def initialize(options = {})
+      super options
+      @phases[:initial] = InitialPhase.new(self, @tree)
+      @phases[:rootElement] = XhmlRootPhase.new(self, @tree)
     end
 
     def normalizeToken(token)
-        super(token)
+      super(token)
 
-        # ensure that non-void XHTML elements have content so that separate
-        # open and close tags are emitted
-        if token[:type]  == :EndTag and \
-            not VOID_ELEMENTS.include? token[:name] and \
-            token[:name] == @tree.openElements[-1].name and \
-            not @tree.openElements[-1].hasContent
-            @tree.insertText('') unless
-                @tree.openElements.any? {|e|
-                    e.attributes.keys.include? 'xmlns' and
-                    e.attributes['xmlns'] != 'http://www.w3.org/1999/xhtml'
-                }
-        end
+      # ensure that non-void XHTML elements have content so that separate
+      # open and close tags are emitted
+      if token[:type]  == :EndTag and \
+        not VOID_ELEMENTS.include? token[:name] and \
+        token[:name] == @tree.openElements[-1].name and \
+        not @tree.openElements[-1].hasContent
+        @tree.insertText('') unless
+          @tree.openElements.any? {|e|
+            e.attributes.keys.include? 'xmlns' and
+            e.attributes['xmlns'] != 'http://www.w3.org/1999/xhtml'
+          }
+      end
 
-        return token
+      return token
     end
-end
+  end
 
-class XhmlRootPhase < RootElementPhase
+  class XhmlRootPhase < RootElementPhase
     def insertHtmlElement
-        element = @tree.createElement("html", {'xmlns' => 'http://www.w3.org/1999/xhtml'})
-        @tree.openElements.push(element)
-        @tree.document.appendChild(element)
-        @parser.phase = @parser.phases[:beforeHead]
+      element = @tree.createElement("html", {'xmlns' => 'http://www.w3.org/1999/xhtml'})
+      @tree.openElements.push(element)
+      @tree.document.appendChild(element)
+      @parser.phase = @parser.phases[:beforeHead]
     end
-end
+  end
 
-class XmlRootPhase < Phase
+  class XmlRootPhase < Phase
     # Prime the Xml parser
     @start_tag_handlers = Hash.new(:startTagOther)
     @end_tag_handlers = Hash.new(:endTagOther)
     def startTagOther(name, attributes)
-        @tree.openElements.push(@tree.document)
-        element = @tree.createElement(name, attributes)
-        @tree.openElements[-1].appendChild(element)
-        @tree.openElements.push(element)
-        @parser.phase = XmlElementPhase.new(@parser,@tree)
+      @tree.openElements.push(@tree.document)
+      element = @tree.createElement(name, attributes)
+      @tree.openElements[-1].appendChild(element)
+      @tree.openElements.push(element)
+      @parser.phase = XmlElementPhase.new(@parser,@tree)
     end
     def endTagOther(name)
-        super
-        @tree.openElements.pop
+      super
+      @tree.openElements.pop
     end
-end
+  end
 
-class XmlElementPhase < Phase
+  class XmlElementPhase < Phase
     # Generic handling for all XML elements
 
     @start_tag_handlers = Hash.new(:startTagOther)
     @end_tag_handlers = Hash.new(:endTagOther)
 
     def startTagOther(name, attributes)
-        element = @tree.createElement(name, attributes)
-        @tree.openElements[-1].appendChild(element)
-        @tree.openElements.push(element)
+      element = @tree.createElement(name, attributes)
+      @tree.openElements[-1].appendChild(element)
+      @tree.openElements.push(element)
     end
 
     def endTagOther(name)
-        for node in @tree.openElements.reverse
-            if node.name == name
-                {} while @tree.openElements.pop != node
-                break
-            else
-                @parser.parseError
-            end
+      for node in @tree.openElements.reverse
+        if node.name == name
+          {} while @tree.openElements.pop != node
+          break
+        else
+          @parser.parseError
         end
+      end
     end
 
     def processCharacters(data)
-        @tree.insertText(data)
+      @tree.insertText(data)
     end
-end
+  end
 
 end
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/sanitizer.rb b/vendor/plugins/HTML5lib/lib/html5lib/sanitizer.rb
index ca87f91a..6f7cdcac 100644
--- a/vendor/plugins/HTML5lib/lib/html5lib/sanitizer.rb
+++ b/vendor/plugins/HTML5lib/lib/html5lib/sanitizer.rb
@@ -6,87 +6,87 @@ module HTML5lib
 # This module provides sanitization of XHTML+MathML+SVG
 # and of inline style attributes.
 
-class HTMLSanitizer < HTMLTokenizer
+  class HTMLSanitizer < HTMLTokenizer
 
     ACCEPTABLE_ELEMENTS = %w[a abbr acronym address area b big blockquote br
-        button caption center cite code col colgroup dd del dfn dir div dl dt
-        em fieldset font form h1 h2 h3 h4 h5 h6 hr i img input ins kbd label
-        legend li map menu ol optgroup option p pre q s samp select small span
-        strike strong sub sup table tbody td textarea tfoot th thead tr tt u
-        ul var]
+      button caption center cite code col colgroup dd del dfn dir div dl dt
+      em fieldset font form h1 h2 h3 h4 h5 h6 hr i img input ins kbd label
+      legend li map menu ol optgroup option p pre q s samp select small span
+      strike strong sub sup table tbody td textarea tfoot th thead tr tt u
+      ul var]
 
     MATHML_ELEMENTS = %w[maction math merror mfrac mi mmultiscripts mn mo
-        mover mpadded mphantom mprescripts mroot mrow mspace msqrt mstyle msub
-        msubsup msup mtable mtd mtext mtr munder munderover none]
+      mover mpadded mphantom mprescripts mroot mrow mspace msqrt mstyle msub
+      msubsup msup mtable mtd mtext mtr munder munderover none]
 
     SVG_ELEMENTS = %w[a animate animateColor animateMotion animateTransform
-        circle defs desc ellipse font-face font-face-name font-face-src g
-        glyph hkern image linearGradient line marker metadata missing-glyph
-        mpath path polygon polyline radialGradient rect set stop svg switch
-        text title tspan use]
+      circle defs desc ellipse font-face font-face-name font-face-src g
+      glyph hkern image linearGradient line marker metadata missing-glyph
+      mpath path polygon polyline radialGradient rect set stop svg switch
+      text title tspan use]
 
     ACCEPTABLE_ATTRIBUTES = %w[abbr accept accept-charset accesskey action
-        align alt axis border cellpadding cellspacing char charoff charset
-        checked cite class clear cols colspan color compact coords datetime
-        dir disabled enctype for frame headers height href hreflang hspace id
-        ismap label lang longdesc maxlength media method multiple name nohref
-        noshade nowrap prompt readonly rel rev rows rowspan rules scope
-        selected shape size span src start style summary tabindex target title
-        type usemap valign value vspace width xml:lang]
+      align alt axis border cellpadding cellspacing char charoff charset
+      checked cite class clear cols colspan color compact coords datetime
+      dir disabled enctype for frame headers height href hreflang hspace id
+      ismap label lang longdesc maxlength media method multiple name nohref
+      noshade nowrap prompt readonly rel rev rows rowspan rules scope
+      selected shape size span src start style summary tabindex target title
+      type usemap valign value vspace width xml:lang]
 
     MATHML_ATTRIBUTES = %w[actiontype align columnalign columnalign
-        columnalign columnlines columnspacing columnspan depth display
-        displaystyle equalcolumns equalrows fence fontstyle fontweight frame
-        height linethickness lspace mathbackground mathcolor mathvariant
-        mathvariant maxsize minsize other rowalign rowalign rowalign rowlines
-        rowspacing rowspan rspace scriptlevel selection separator stretchy
-        width width xlink:href xlink:show xlink:type xmlns xmlns:xlink]
+      columnalign columnlines columnspacing columnspan depth display
+      displaystyle equalcolumns equalrows fence fontstyle fontweight frame
+      height linethickness lspace mathbackground mathcolor mathvariant
+      mathvariant maxsize minsize other rowalign rowalign rowalign rowlines
+      rowspacing rowspan rspace scriptlevel selection separator stretchy
+      width width xlink:href xlink:show xlink:type xmlns xmlns:xlink]
 
     SVG_ATTRIBUTES = %w[accent-height accumulate additive alphabetic
-         arabic-form ascent attributeName attributeType baseProfile bbox begin
-         by calcMode cap-height class color color-rendering content cx cy d dx
-         dy descent display dur end fill fill-rule font-family font-size
-         font-stretch font-style font-variant font-weight from fx fy g1 g2
-         glyph-name gradientUnits hanging height horiz-adv-x horiz-origin-x id
-         ideographic k keyPoints keySplines keyTimes lang marker-end
-         marker-mid marker-start markerHeight markerUnits markerWidth
-         mathematical max min name offset opacity orient origin
-         overline-position overline-thickness panose-1 path pathLength points
-         preserveAspectRatio r refX refY repeatCount repeatDur
-         requiredExtensions requiredFeatures restart rotate rx ry slope stemh
-         stemv stop-color stop-opacity strikethrough-position
-         strikethrough-thickness stroke stroke-dasharray stroke-dashoffset
-         stroke-linecap stroke-linejoin stroke-miterlimit stroke-opacity
-         stroke-width systemLanguage target text-anchor to transform type u1
-         u2 underline-position underline-thickness unicode unicode-range
-         units-per-em values version viewBox visibility width widths x
-         x-height x1 x2 xlink:actuate xlink:arcrole xlink:href xlink:role
-         xlink:show xlink:title xlink:type xml:base xml:lang xml:space xmlns
-         xmlns:xlink y y1 y2 zoomAndPan]
+       arabic-form ascent attributeName attributeType baseProfile bbox begin
+       by calcMode cap-height class color color-rendering content cx cy d dx
+       dy descent display dur end fill fill-rule font-family font-size
+       font-stretch font-style font-variant font-weight from fx fy g1 g2
+       glyph-name gradientUnits hanging height horiz-adv-x horiz-origin-x id
+       ideographic k keyPoints keySplines keyTimes lang marker-end
+       marker-mid marker-start markerHeight markerUnits markerWidth
+       mathematical max min name offset opacity orient origin
+       overline-position overline-thickness panose-1 path pathLength points
+       preserveAspectRatio r refX refY repeatCount repeatDur
+       requiredExtensions requiredFeatures restart rotate rx ry slope stemh
+       stemv stop-color stop-opacity strikethrough-position
+       strikethrough-thickness stroke stroke-dasharray stroke-dashoffset
+       stroke-linecap stroke-linejoin stroke-miterlimit stroke-opacity
+       stroke-width systemLanguage target text-anchor to transform type u1
+       u2 underline-position underline-thickness unicode unicode-range
+       units-per-em values version viewBox visibility width widths x
+       x-height x1 x2 xlink:actuate xlink:arcrole xlink:href xlink:role
+       xlink:show xlink:title xlink:type xml:base xml:lang xml:space xmlns
+       xmlns:xlink y y1 y2 zoomAndPan]
 
     ATTR_VAL_IS_URI = %w[href src cite action longdesc xlink:href]
 
     ACCEPTABLE_CSS_PROPERTIES = %w[azimuth background-color
-        border-bottom-color border-collapse border-color border-left-color
-        border-right-color border-top-color clear color cursor direction
-        display elevation float font font-family font-size font-style
-        font-variant font-weight height letter-spacing line-height overflow
-        pause pause-after pause-before pitch pitch-range richness speak
-        speak-header speak-numeral speak-punctuation speech-rate stress
-        text-align text-decoration text-indent unicode-bidi vertical-align
-        voice-family volume white-space width]
+      border-bottom-color border-collapse border-color border-left-color
+      border-right-color border-top-color clear color cursor direction
+      display elevation float font font-family font-size font-style
+      font-variant font-weight height letter-spacing line-height overflow
+      pause pause-after pause-before pitch pitch-range richness speak
+      speak-header speak-numeral speak-punctuation speech-rate stress
+      text-align text-decoration text-indent unicode-bidi vertical-align
+      voice-family volume white-space width]
 
     ACCEPTABLE_CSS_KEYWORDS = %w[auto aqua black block blue bold both bottom
-        brown center collapse dashed dotted fuchsia gray green !important
-        italic left lime maroon medium none navy normal nowrap olive pointer
-        purple red right solid silver teal top transparent underline white
-        yellow]
+      brown center collapse dashed dotted fuchsia gray green !important
+      italic left lime maroon medium none navy normal nowrap olive pointer
+      purple red right solid silver teal top transparent underline white
+      yellow]
 
     ACCEPTABLE_SVG_PROPERTIES = %w[fill fill-opacity fill-rule stroke
-        stroke-width stroke-linecap stroke-linejoin stroke-opacity]
+      stroke-width stroke-linecap stroke-linejoin stroke-opacity]
 
     ACCEPTABLE_PROTOCOLS = %w[ed2k ftp http https irc mailto news gopher nntp
-        telnet webcal xmpp callto feed urn aim rsync tag ssh sftp rtsp afs]
+      telnet webcal xmpp callto feed urn aim rsync tag ssh sftp rtsp afs]
 
     # subclasses may define their own versions of these constants
     ALLOWED_ELEMENTS = ACCEPTABLE_ELEMENTS + MATHML_ELEMENTS + SVG_ELEMENTS
@@ -104,75 +104,74 @@ class HTMLSanitizer < HTMLTokenizer
     # in ALLOWED_PROTOCOLS are allowed.
     #
     #   sanitize_html('<script> do_nasty_stuff() </script>')
-    #    => &lt;script> do_nasty_stuff() &lt;/script>
+    #  => &lt;script> do_nasty_stuff() &lt;/script>
     #   sanitize_html('<a href="javascript: sucker();">Click here for $100</a>')
-    #    => <a>Click here for $100</a>
+    #  => <a>Click here for $100</a>
     def each
-        super do |token|
-            case token[:type]
-            when :StartTag, :EndTag, :EmptyTag
-                if ALLOWED_ELEMENTS.include?(token[:name])
-                    if token.has_key? :data
-                        attrs = Hash[*token[:data].flatten]
-                        attrs.delete_if { |attr,v| !ALLOWED_ATTRIBUTES.include?(attr) }
-                        ATTR_VAL_IS_URI.each do |attr|
-                            val_unescaped = CGI.unescapeHTML(attrs[attr].to_s).gsub(/[\000-\040\177\s]+|\302[\200-\240]/,'').downcase
-                            if val_unescaped =~ /^[a-z0-9][-+.a-z0-9]*:/ and !ALLOWED_PROTOCOLS.include?(val_unescaped.split(':')[0])
-                                attrs.delete attr
-                            end
-                        end
-                        if attrs['style']
-                            attrs['style'] = sanitize_css(attrs['style'])
-                        end
-                        token[:data] = attrs.map {|k,v| [k,v]}
-                    end
-                    yield token
-                else
-                    if token[:type] == :EndTag
-                        token[:data] = "</#{token[:name]}>"
-                    elsif token[:data]
-                        attrs = token[:data].map {|k,v| " #{k}=\"#{CGI.escapeHTML(v)}\""}.join('')
-                        token[:data] = "<#{token[:name]}#{attrs}>"
-                    else
-                        token[:data] = "<#{token[:name]}>"
-                    end
-                    token[:data].insert(-2,'/') if token[:type] == :EmptyTag
-                    token[:type] = :Characters
-                    token.delete(:name)
-                    yield token
+      super do |token|
+        case token[:type]
+        when :StartTag, :EndTag, :EmptyTag
+          if ALLOWED_ELEMENTS.include?(token[:name])
+            if token.has_key? :data
+              attrs = Hash[*token[:data].flatten]
+              attrs.delete_if { |attr,v| !ALLOWED_ATTRIBUTES.include?(attr) }
+              ATTR_VAL_IS_URI.each do |attr|
+                val_unescaped = CGI.unescapeHTML(attrs[attr].to_s).gsub(/[\000-\040\177\s]+|\302[\200-\240]/,'').downcase
+                if val_unescaped =~ /^[a-z0-9][-+.a-z0-9]*:/ and !ALLOWED_PROTOCOLS.include?(val_unescaped.split(':')[0])
+                  attrs.delete attr
                 end
-            else
-                yield token
-            end
-
-          end
-      end
-
-      def sanitize_css(style)
-          # disallow urls
-          style = style.to_s.gsub(/url\s*\(\s*[^\s)]+?\s*\)\s*/, ' ')
-
-          # gauntlet
-          return '' unless style =~ /^([:,;#%.\sa-zA-Z0-9!]|\w-\w|\'[\s\w]+\'|\"[\s\w]+\"|\([\d,\s]+\))*$/
-          return '' unless style =~ /^(\s*[-\w]+\s*:\s*[^:;]*(;|$))*$/
-
-          clean = []
-          style.scan(/([-\w]+)\s*:\s*([^:;]*)/) do |prop,val|
-              next if val.empty?
-              prop.downcase!
-              if ALLOWED_CSS_PROPERTIES.include?(prop)
-                  clean << "#{prop}: #{val};"
-              elsif %w[background border margin padding].include?(prop.split('-')[0])
-                  clean << "#{prop}: #{val};" unless val.split().any? do |keyword|
-                      !ALLOWED_CSS_KEYWORDS.include?(keyword) and
-                      keyword !~ /^(#[0-9a-f]+|rgb\(\d+%?,\d*%?,?\d*%?\)?|\d{0,2}\.?\d{0,2}(cm|em|ex|in|mm|pc|pt|px|%|,|\))?)$/
-                  end
-              elsif ALLOWED_SVG_PROPERTIES.include?(prop)
-                  clean << "#{prop}: #{val};"
               end
+              if attrs['style']
+                attrs['style'] = sanitize_css(attrs['style'])
+              end
+              token[:data] = attrs.map {|k,v| [k,v]}
+            end
+            yield token
+          else
+            if token[:type] == :EndTag
+              token[:data] = "</#{token[:name]}>"
+            elsif token[:data]
+              attrs = token[:data].map {|k,v| " #{k}=\"#{CGI.escapeHTML(v)}\""}.join('')
+              token[:data] = "<#{token[:name]}#{attrs}>"
+            else
+              token[:data] = "<#{token[:name]}>"
+            end
+            token[:data].insert(-2,'/') if token[:type] == :EmptyTag
+            token[:type] = :Characters
+            token.delete(:name)
+            yield token
           end
-
-          style = clean.join(' ')
+        else
+          yield token
+        end
       end
-end
+    end
+
+    def sanitize_css(style)
+      # disallow urls
+      style = style.to_s.gsub(/url\s*\(\s*[^\s)]+?\s*\)\s*/, ' ')
+
+      # gauntlet
+      return '' unless style =~ /^([:,;#%.\sa-zA-Z0-9!]|\w-\w|\'[\s\w]+\'|\"[\s\w]+\"|\([\d,\s]+\))*$/
+      return '' unless style =~ /^(\s*[-\w]+\s*:\s*[^:;]*(;|$))*$/
+
+      clean = []
+      style.scan(/([-\w]+)\s*:\s*([^:;]*)/) do |prop, val|
+        next if val.empty?
+        prop.downcase!
+        if ALLOWED_CSS_PROPERTIES.include?(prop)
+          clean << "#{prop}: #{val};"
+        elsif %w[background border margin padding].include?(prop.split('-')[0])
+          clean << "#{prop}: #{val};" unless val.split().any? do |keyword|
+            !ALLOWED_CSS_KEYWORDS.include?(keyword) and
+            keyword !~ /^(#[0-9a-f]+|rgb\(\d+%?,\d*%?,?\d*%?\)?|\d{0,2}\.?\d{0,2}(cm|em|ex|in|mm|pc|pt|px|%|,|\))?)$/
+          end
+        elsif ALLOWED_SVG_PROPERTIES.include?(prop)
+          clean << "#{prop}: #{val};"
+        end
+      end
+
+      style = clean.join(' ')
+    end
+  end
 end
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/tokenizer.rb b/vendor/plugins/HTML5lib/lib/html5lib/tokenizer.rb
index c00760d3..4c99b10d 100644
--- a/vendor/plugins/HTML5lib/lib/html5lib/tokenizer.rb
+++ b/vendor/plugins/HTML5lib/lib/html5lib/tokenizer.rb
@@ -3,63 +3,63 @@ require 'html5lib/inputstream'
 
 module HTML5lib
 
-# This class takes care of tokenizing HTML.
-#
-# * @currentToken
-#   Holds the token that is currently being processed.
-#
-# * @state
-#   Holds a reference to the method to be invoked... XXX
-#
-# * @states
-#   Holds a mapping between states and methods that implement the state.
-#
-# * @stream
-#   Points to HTMLInputStream object.
+  # This class takes care of tokenizing HTML.
+  #
+  # * @currentToken
+  #   Holds the token that is currently being processed.
+  #
+  # * @state
+  #   Holds a reference to the method to be invoked... XXX
+  #
+  # * @states
+  #   Holds a mapping between states and methods that implement the state.
+  #
+  # * @stream
+  #   Points to HTMLInputStream object.
 
-class HTMLTokenizer
+  class HTMLTokenizer
     attr_accessor :contentModelFlag, :currentToken
     attr_reader :stream
 
     # XXX need to fix documentation
 
-    def initialize(stream, options={})
-        @stream = HTMLInputStream.new(stream, options)
+    def initialize(stream, options = {})
+      @stream = HTMLInputStream.new(stream, options)
 
-        @states = {
-            :data => :dataState,
-            :entityData => :entityDataState,
-            :tagOpen => :tagOpenState,
-            :closeTagOpen => :closeTagOpenState,
-            :tagName => :tagNameState,
-            :beforeAttributeName => :beforeAttributeNameState,
-            :attributeName => :attributeNameState,
-            :afterAttributeName => :afterAttributeNameState,
-            :beforeAttributeValue => :beforeAttributeValueState,
-            :attributeValueDoubleQuoted => :attributeValueDoubleQuotedState,
-            :attributeValueSingleQuoted => :attributeValueSingleQuotedState,
-            :attributeValueUnQuoted => :attributeValueUnQuotedState,
-            :bogusComment => :bogusCommentState,
-            :markupDeclarationOpen => :markupDeclarationOpenState,
-            :comment => :commentState,
-            :commentDash => :commentDashState,
-            :commentEnd => :commentEndState,
-            :doctype => :doctypeState,
-            :beforeDoctypeName => :beforeDoctypeNameState,
-            :doctypeName => :doctypeNameState,
-            :afterDoctypeName => :afterDoctypeNameState,
-            :bogusDoctype => :bogusDoctypeState
-        }
+      @states = {
+        :data => :dataState,
+        :entityData => :entityDataState,
+        :tagOpen => :tagOpenState,
+        :closeTagOpen => :closeTagOpenState,
+        :tagName => :tagNameState,
+        :beforeAttributeName => :beforeAttributeNameState,
+        :attributeName => :attributeNameState,
+        :afterAttributeName => :afterAttributeNameState,
+        :beforeAttributeValue => :beforeAttributeValueState,
+        :attributeValueDoubleQuoted => :attributeValueDoubleQuotedState,
+        :attributeValueSingleQuoted => :attributeValueSingleQuotedState,
+        :attributeValueUnQuoted => :attributeValueUnQuotedState,
+        :bogusComment => :bogusCommentState,
+        :markupDeclarationOpen => :markupDeclarationOpenState,
+        :comment => :commentState,
+        :commentDash => :commentDashState,
+        :commentEnd => :commentEndState,
+        :doctype => :doctypeState,
+        :beforeDoctypeName => :beforeDoctypeNameState,
+        :doctypeName => :doctypeNameState,
+        :afterDoctypeName => :afterDoctypeNameState,
+        :bogusDoctype => :bogusDoctypeState
+      }
 
-        # Setup the initial tokenizer state
-        @contentModelFlag = :PCDATA
-        @state = @states[:data]
+      # Setup the initial tokenizer state
+      @contentModelFlag = :PCDATA
+      @state = @states[:data]
 
-        # The current token being created
-        @currentToken = nil
+      # The current token being created
+      @currentToken = nil
 
-        # Tokens to be processed.
-        @tokenQueue = []
+      # Tokens to be processed.
+      @tokenQueue = []
     end
 
     # This is where the magic happens.
@@ -68,37 +68,37 @@ class HTMLTokenizer
     # to return we yield the token which pauses processing until the next token
     # is requested.
     def each
-        @stream.reset
-        @tokenQueue = []
-        # Start processing. When EOF is reached @state will return false
-        # instead of true and the loop will terminate.
-        while send @state
-            while not @tokenQueue.empty?
-                yield @tokenQueue.shift
-            end
+      @stream.reset
+      @tokenQueue = []
+      # Start processing. When EOF is reached @state will return false
+      # instead of true and the loop will terminate.
+      while send @state
+        while not @tokenQueue.empty?
+          yield @tokenQueue.shift
         end
+      end
     end
 
     # Below are various helper functions the tokenizer states use worked out.
-    
+  
     # If the next character is a '>', convert the currentToken into
     # an EmptyTag
 
     def processSolidusInTag
 
-        # We need to consume another character to make sure it's a ">"
-        data = @stream.char
+      # We need to consume another character to make sure it's a ">"
+      data = @stream.char
 
-        if @currentToken[:type] == :StartTag and data == ">"
-            @currentToken[:type] = :EmptyTag
-        else
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Solidus (/) incorrectly placed in tag.")})
-        end
+      if @currentToken[:type] == :StartTag and data == ">"
+        @currentToken[:type] = :EmptyTag
+      else
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Solidus (/) incorrectly placed in tag.")})
+      end
 
-        # The character we just consumed need to be put back on the stack so it
-        # doesn't get lost...
-        @stream.queue.push(data)
+      # The character we just consumed needs to be put back on the stream
+      # queue so it doesn't get lost.
+      @stream.queue.push(data)
     end
 
     # This function returns either U+FFFD or the character based on the
@@ -107,748 +107,746 @@ class HTMLTokenizer
 
     def consumeNumberEntity(isHex)
 
-        # XXX More need to be done here. For instance, #13 should prolly be
-        # converted to #10 so we don't get \r (#13 is \r right?) in the DOM and
-        # such. Thoughts on this appreciated.
-        allowed = DIGITS
-        radix = 10
-        if isHex
-            allowed = HEX_DIGITS
-            radix = 16
-        end
+      # XXX More needs to be done here. For instance, #13 should probably be
+      # converted to #10 so we don't get \r (#13 is \r) in the DOM and
+      # such. Thoughts on this appreciated.
+      allowed = DIGITS
+      radix = 10
+      if isHex
+        allowed = HEX_DIGITS
+        radix = 16
+      end
 
-        char = [0xFFFD].pack('U')
-        charStack = []
+      char = [0xFFFD].pack('U')
+      charStack = []
 
-        # Consume all the characters that are in range while making sure we
-        # don't hit an EOF.
+      # Consume all the characters that are in range while making sure we
+      # don't hit an EOF.
+      c = @stream.char
+      while allowed.include?(c) and c != :EOF
+        charStack.push(c)
         c = @stream.char
-        while allowed.include?(c) and c != :EOF
-            charStack.push(c)
-            c = @stream.char
-        end
+      end
 
-        # Convert the set of characters consumed to an int.
-        charAsInt = charStack.join('').to_i(radix)
+      # Convert the set of characters consumed to an int.
+      charAsInt = charStack.join('').to_i(radix)
 
-        # If the integer is between 127 and 160 (so 128 and bigger and 159 and
-        # smaller) we need to do the "windows trick".
-        if (127...160).include? charAsInt
-            #XXX - removed parse error from windows 1252 entity for now
-            #we may want to reenable this later
-            #@tokenQueue.push({:type => :ParseError, :data =>
-            #  _("Entity used with illegal number (windows-1252 reference).")})
+      # If the integer is in 128..159 we need to do the "windows trick". 127 is
+      # excluded: 127 - 128 is -1, which would wrap to the table's last entry.
+      if (128...160).include? charAsInt
+        #XXX - removed parse error from windows 1252 entity for now
+        #we may want to reenable this later
+        #@tokenQueue.push({:type => :ParseError, :data =>
+        #  _("Entity used with illegal number (windows-1252 reference).")})
 
-            charAsInt = ENTITIES_WINDOWS1252[charAsInt - 128]
-        end
+        charAsInt = ENTITIES_WINDOWS1252[charAsInt - 128]
+      end
 
-        # 0 is not a good number.
-        if charAsInt == 0
-            charAsInt = 65533
-        end
+      # 0 is not a usable code point; substitute U+FFFD (65533) instead.
+      if charAsInt == 0
+        charAsInt = 65533
+      end
 
-        if charAsInt <= 0x10FFF
-            char = [charAsInt].pack('U')
-        else
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Numeric entity couldn't be converted to character.")})
-        end
+      if charAsInt <= 0x10FFFF
+        char = [charAsInt].pack('U')
+      else
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Numeric entity couldn't be converted to character.")})
+      end
 
-        # Discard the ; if present. Otherwise, put it back on the queue and
-        # invoke parseError on parser.
-        if c != ";"
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Numeric entity didn't end with ';'.")})
-            @stream.queue.push(c)
-        end
+      # Discard the ; if present. Otherwise, queue a ParseError token and put
+      # the character back on the stream queue.
+      if c != ";"
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Numeric entity didn't end with ';'.")})
+        @stream.queue.push(c)
+      end
 
-        return char
+      return char
     end
 
     def consumeEntity
-        char = nil
-        charStack = [@stream.char]
-        if charStack[0] == "#"
-            # We might have a number entity here.
-            charStack += [@stream.char, @stream.char]
-            if charStack.include? :EOF
-                # If we reach the end of the file put everything up to :EOF
-                # back in the queue
-                charStack = charStack[0...charStack.index(:EOF)]
-                @stream.queue+= charStack
-                @tokenQueue.push({:type => :ParseError, :data =>
-                  _("Numeric entity expected. Got end of file instead.")})
-            else
-                if charStack[1].downcase == "x" \
-                  and HEX_DIGITS.include? charStack[2]
-                    # Hexadecimal entity detected.
-                    @stream.queue.push(charStack[2])
-                    char = consumeNumberEntity(true)
-                elsif DIGITS.include? charStack[1]
-                    # Decimal entity detected.
-                    @stream.queue += charStack[1..-1]
-                    char = consumeNumberEntity(false)
-                else
-                    # No number entity detected.
-                    @stream.queue += charStack
-                    @tokenQueue.push({:type => :ParseError, :data =>
-                      _("Numeric entity expected but none found.")})
-                end
-            end
-        # Break out if we reach the end of the file
-        elsif charStack[0] == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Entity expected. Got end of file instead.")})
+      char = nil
+      charStack = [@stream.char]
+      if charStack[0] == "#"
+        # We might have a number entity here.
+        charStack += [@stream.char, @stream.char]
+        if charStack.include? :EOF
+          # If we reach the end of the file put everything up to :EOF
+          # back in the queue
+          charStack = charStack[0...charStack.index(:EOF)]
+          @stream.queue+= charStack
+          @tokenQueue.push({:type => :ParseError, :data =>
+            _("Numeric entity expected. Got end of file instead.")})
         else
-            # At this point in the process might have named entity. Entities
-            # are stored in the global variable "entities".
-            #
-            # Consume characters and compare to these to a substring of the
-            # entity names in the list until the substring no longer matches.
-            filteredEntityList = ENTITIES.keys
-            filteredEntityList.reject! {|e| e[0].chr != charStack[0]}
-            entityName = nil
-
-            while charStack[-1] != :EOF
-                name = charStack.join('')
-                if filteredEntityList.any? {|e| e[0...name.length] == name}
-                    filteredEntityList.reject! {|e| e[0...name.length] != name}
-                    charStack.push(@stream.char)
-                else
-                    break
-                end
-
-                if ENTITIES.include? name
-                    entityName = name
-                end
-            end
-
-            if entityName != nil
-                char = ENTITIES[entityName]
-
-                # Check whether or not the last character returned can be
-                # discarded or needs to be put back.
-                if not charStack[-1] == ";"
-                    @tokenQueue.push({:type => :ParseError, :data =>
-                      _("Named entity didn't end with ';'.")})
-                    @stream.queue += charStack[entityName.length..-1]
-                end
-            else
-                @tokenQueue.push({:type => :ParseError, :data =>
-                  _("Named entity expected. Got none.")})
-                @stream.queue += charStack
-            end
+          if charStack[1].downcase == "x" \
+            and HEX_DIGITS.include? charStack[2]
+            # Hexadecimal entity detected.
+            @stream.queue.push(charStack[2])
+            char = consumeNumberEntity(true)
+          elsif DIGITS.include? charStack[1]
+            # Decimal entity detected.
+            @stream.queue += charStack[1..-1]
+            char = consumeNumberEntity(false)
+          else
+            # No number entity detected.
+            @stream.queue += charStack
+            @tokenQueue.push({:type => :ParseError, :data =>
+              _("Numeric entity expected but none found.")})
+          end
         end
-        return char
+      # Break out if we reach the end of the file
+      elsif charStack[0] == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Entity expected. Got end of file instead.")})
+      else
+        # At this point we might have a named entity. Entity names are the
+        # keys of the ENTITIES constant.
+        #
+        # Consume characters and compare them to a prefix of the entity
+        # names in the list until the prefix no longer matches.
+        filteredEntityList = ENTITIES.keys
+        filteredEntityList.reject! {|e| e[0].chr != charStack[0]}
+        entityName = nil
+
+        while charStack[-1] != :EOF
+          name = charStack.join('')
+          if filteredEntityList.any? {|e| e[0...name.length] == name}
+            filteredEntityList.reject! {|e| e[0...name.length] != name}
+            charStack.push(@stream.char)
+          else
+            break
+          end
+
+          if ENTITIES.include? name
+            entityName = name
+          end
+        end
+
+        if entityName != nil
+          char = ENTITIES[entityName]
+
+          # Check whether or not the last character returned can be
+          # discarded or needs to be put back.
+          if not charStack[-1] == ";"
+            @tokenQueue.push({:type => :ParseError, :data =>
+              _("Named entity didn't end with ';'.")})
+            @stream.queue += charStack[entityName.length..-1]
+          end
+        else
+          @tokenQueue.push({:type => :ParseError, :data =>
+            _("Named entity expected. Got none.")})
+          @stream.queue += charStack
+        end
+      end
+      return char
     end
 
     # This method replaces the need for "entityInAttributeValueState".
     def processEntityInAttribute
-        entity = consumeEntity
-        if entity
-            @currentToken[:data][-1][1] += entity
-        else
-            @currentToken[:data][-1][1] += "&"
-        end
+      entity = consumeEntity
+      if entity
+        @currentToken[:data][-1][1] += entity
+      else
+        @currentToken[:data][-1][1] += "&"
+      end
     end
 
     # This method is a generic handler for emitting the tags. It also sets
     # the state to "data" because that's what's needed after a token has been
     # emitted.
     def emitCurrentToken
-        # Add token to the queue to be yielded
-        @tokenQueue.push(@currentToken)
-        @state = @states[:data]
+      # Add token to the queue to be yielded
+      @tokenQueue.push(@currentToken)
+      @state = @states[:data]
     end
 
-
     # Below are the various tokenizer states worked out.
 
     # XXX AT Perhaps we should have Hixie run some evaluation on billions of
     # documents to figure out what the order of the various if and elsif
     # statements should be.
-
     def dataState
-        data = @stream.char
-        if data == "&" and (@contentModelFlag == :PCDATA or
-            @contentModelFlag == :RCDATA)
-            @state = @states[:entityData]
-        elsif data == "<" and @contentModelFlag != :PLAINTEXT
-            @state = @states[:tagOpen]
-        elsif data == :EOF
-            # Tokenization ends.
-            return false
-        elsif SPACE_CHARACTERS.include? data
-            # Directly after emitting a token you switch back to the "data
-            # state". At that point SPACE_CHARACTERS are important so they are
-            # emitted separately.
-            # XXX need to check if we don't need a special "spaces" flag on
-            # characters.
-            @tokenQueue.push({:type => :SpaceCharacters, :data =>
-              data + @stream.charsUntil(SPACE_CHARACTERS, true)})
-        else
-            @tokenQueue.push({:type => :Characters, :data => 
-              data + @stream.charsUntil(["&", "<"])})
-        end
-        return true
+      data = @stream.char
+      if data == "&" and (@contentModelFlag == :PCDATA or
+        @contentModelFlag == :RCDATA)
+        @state = @states[:entityData]
+      elsif data == "<" and @contentModelFlag != :PLAINTEXT
+        @state = @states[:tagOpen]
+      elsif data == :EOF
+        # Tokenization ends.
+        return false
+      elsif SPACE_CHARACTERS.include? data
+        # Directly after emitting a token you switch back to the "data
+        # state". At that point SPACE_CHARACTERS are important so they are
+        # emitted separately.
+        # XXX need to check if we don't need a special "spaces" flag on
+        # characters.
+        @tokenQueue.push({:type => :SpaceCharacters, :data =>
+          data + @stream.chars_until(SPACE_CHARACTERS, true)})
+      else
+        @tokenQueue.push({:type => :Characters, :data => 
+          data + @stream.chars_until(["&", "<"])})
+      end
+      return true
     end
 
     def entityDataState
-        entity = consumeEntity
-        if entity
-            @tokenQueue.push({:type => :Characters, :data => entity})
-        else
-            @tokenQueue.push({:type => :Characters, :data => "&"})
-        end
-        @state = @states[:data]
-        return true
+      entity = consumeEntity
+      if entity
+        @tokenQueue.push({:type => :Characters, :data => entity})
+      else
+        @tokenQueue.push({:type => :Characters, :data => "&"})
+      end
+      @state = @states[:data]
+      return true
     end
 
     def tagOpenState
-        data = @stream.char
-        if @contentModelFlag == :PCDATA
-            if data == "!"
-                @state = @states[:markupDeclarationOpen]
-            elsif data == "/"
-                @state = @states[:closeTagOpen]
-            elsif data != :EOF and ASCII_LETTERS.include? data
-                @currentToken =\
-                  {:type => :StartTag, :name => data, :data => []}
-                @state = @states[:tagName]
-            elsif data == ">"
-                # XXX In theory it could be something besides a tag name. But
-                # do we really care?
-                @tokenQueue.push({:type => :ParseError, :data =>
-                  _("Expected tag name. Got '>' instead.")})
-                @tokenQueue.push({:type => :Characters, :data => "<>"})
-                @state = @states[:data]
-            elsif data == "?"
-                # XXX In theory it could be something besides a tag name. But
-                # do we really care?
-                @tokenQueue.push({:type => :ParseError, :data =>
-                  _("Expected tag name. Got '?' instead (HTML doesn't " +
-                  "support processing instructions).")})
-                @stream.queue.push(data)
-                @state = @states[:bogusComment]
-            else
-                # XXX
-                @tokenQueue.push({:type => :ParseError, :data =>
-                  _("Expected tag name. Got something else instead")})
-                @tokenQueue.push({:type => :Characters, :data => "<"})
-                @stream.queue.push(data)
-                @state = @states[:data]
-            end
+      data = @stream.char
+      if @contentModelFlag == :PCDATA
+        if data == "!"
+          @state = @states[:markupDeclarationOpen]
+        elsif data == "/"
+          @state = @states[:closeTagOpen]
+        elsif data != :EOF and ASCII_LETTERS.include? data
+          @currentToken =\
+            {:type => :StartTag, :name => data, :data => []}
+          @state = @states[:tagName]
+        elsif data == ">"
+          # XXX In theory it could be something besides a tag name. But
+          # do we really care?
+          @tokenQueue.push({:type => :ParseError, :data =>
+            _("Expected tag name. Got '>' instead.")})
+          @tokenQueue.push({:type => :Characters, :data => "<>"})
+          @state = @states[:data]
+        elsif data == "?"
+          # XXX In theory it could be something besides a tag name. But
+          # do we really care?
+          @tokenQueue.push({:type => :ParseError, :data =>
+            _("Expected tag name. Got '?' instead (HTML doesn't " +
+            "support processing instructions).")})
+          @stream.queue.push(data)
+          @state = @states[:bogusComment]
         else
-            # We know the content model flag is set to either RCDATA or CDATA
-            # now because this state can never be entered with the PLAINTEXT
-            # flag.
-            if data == "/"
-                @state = @states[:closeTagOpen]
-            else
-                @tokenQueue.push({:type => :Characters, :data => "<"})
-                @stream.queue.insert(0, data)
-                @state = @states[:data]
-            end
+          # XXX
+          @tokenQueue.push({:type => :ParseError, :data =>
+            _("Expected tag name. Got something else instead")})
+          @tokenQueue.push({:type => :Characters, :data => "<"})
+          @stream.queue.push(data)
+          @state = @states[:data]
         end
-        return true
+      else
+        # We know the content model flag is set to either RCDATA or CDATA
+        # now because this state can never be entered with the PLAINTEXT
+        # flag.
+        if data == "/"
+          @state = @states[:closeTagOpen]
+        else
+          @tokenQueue.push({:type => :Characters, :data => "<"})
+          @stream.queue.insert(0, data)
+          @state = @states[:data]
+        end
+      end
+      return true
     end
 
     def closeTagOpenState
-        if (@contentModelFlag == :RCDATA or @contentModelFlag == :CDATA)
-            if @currentToken
-                charStack = []
+      if (@contentModelFlag == :RCDATA or @contentModelFlag == :CDATA)
+        if @currentToken
+          charStack = []
 
-                # So far we know that "</" has been consumed. We now need to know
-                # whether the next few characters match the name of last emitted
-                # start tag which also happens to be the currentToken. We also need
-                # to have the character directly after the characters that could
-                # match the start tag name.
-                (@currentToken[:name].length + 1).times do
-                    charStack.push(@stream.char)
-                    # Make sure we don't get hit by :EOF
-                    break if charStack[-1] == :EOF
-                end
+          # So far we know that "</" has been consumed. We now need to know
+          # whether the next few characters match the name of last emitted
+          # start tag which also happens to be the currentToken. We also need
+          # to have the character directly after the characters that could
+          # match the start tag name.
+          (@currentToken[:name].length + 1).times do
+            charStack.push(@stream.char)
+            # Make sure we don't get hit by :EOF
+            break if charStack[-1] == :EOF
+          end
 
-                # Since this is just for checking. We put the characters back on
-                # the stack.
-                @stream.queue += charStack
-            end
-
-            if @currentToken and
-              @currentToken[:name].downcase == 
-                charStack[0...-1].join('').downcase and
-              (SPACE_CHARACTERS + [">", "/", "<", :EOF]).include? charStack[-1]
-                # Because the characters are correct we can safely switch to
-                # PCDATA mode now. This also means we don't have to do it when
-                # emitting the end tag token.
-                @contentModelFlag = :PCDATA
-            else
-                @tokenQueue.push({:type => :ParseError, :data =>
-                  _("Expected closing tag after seeing '</'. None found.")})
-                @tokenQueue.push({:type => :Characters, :data => "</"})
-                @state = @states[:data]
-
-                # Need to return here since we don't want the rest of the
-                # method to be walked through.
-                return true
-            end
+          # Since this is just for checking. We put the characters back on
+          # the stack.
+          @stream.queue += charStack
         end
 
-        if @contentModelFlag == :PCDATA
-            data = @stream.char
-            if data == :EOF
-                @tokenQueue.push({:type => :ParseError, :data =>
-                  _("Expected closing tag. Unexpected end of file.")})
-                @tokenQueue.push({:type => :Characters, :data => "</"})
-                @state = @states[:data]
-            elsif ASCII_LETTERS.include? data
-                @currentToken =\
-                  {:type => :EndTag, :name => data, :data => []}
-                @state = @states[:tagName]
-            elsif data == ">"
-                @tokenQueue.push({:type => :ParseError, :data =>
-                  _("Expected closing tag. Got '>' instead. Ignoring '</>'.")})
-                @state = @states[:data]
-            else
-                # XXX data can be _'_...
-                @tokenQueue.push({:type => :ParseError, :data =>
-                  _("Expected closing tag. Unexpected character '" + data + "' found.")})
-                @stream.queue.push(data)
-                @state = @states[:bogusComment]
-            end
+        if @currentToken and
+          @currentToken[:name].downcase == 
+          charStack[0...-1].join('').downcase and
+          (SPACE_CHARACTERS + [">", "/", "<", :EOF]).include? charStack[-1]
+          # Because the characters are correct we can safely switch to
+          # PCDATA mode now. This also means we don't have to do it when
+          # emitting the end tag token.
+          @contentModelFlag = :PCDATA
+        else
+          @tokenQueue.push({:type => :ParseError, :data =>
+            _("Expected closing tag after seeing '</'. None found.")})
+          @tokenQueue.push({:type => :Characters, :data => "</"})
+          @state = @states[:data]
+
+          # Need to return here since we don't want the rest of the
+          # method to be walked through.
+          return true
         end
-        return true
+      end
+
+      if @contentModelFlag == :PCDATA
+        data = @stream.char
+        if data == :EOF
+          @tokenQueue.push({:type => :ParseError, :data =>
+            _("Expected closing tag. Unexpected end of file.")})
+          @tokenQueue.push({:type => :Characters, :data => "</"})
+          @state = @states[:data]
+        elsif ASCII_LETTERS.include? data
+          @currentToken =\
+            {:type => :EndTag, :name => data, :data => []}
+          @state = @states[:tagName]
+        elsif data == ">"
+          @tokenQueue.push({:type => :ParseError, :data =>
+            _("Expected closing tag. Got '>' instead. Ignoring '</>'.")})
+          @state = @states[:data]
+        else
+          # XXX data can be _'_...
+          @tokenQueue.push({:type => :ParseError, :data =>
+            _("Expected closing tag. Unexpected character '" + data + "' found.")})
+          @stream.queue.push(data)
+          @state = @states[:bogusComment]
+        end
+      end
+      return true
     end
 
     def tagNameState
-        data = @stream.char
-        if SPACE_CHARACTERS.include? data
-            @state = @states[:beforeAttributeName]
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file in the tag name.")})
-            emitCurrentToken
-        elsif ASCII_LETTERS.include? data
-            @currentToken[:name] += data +\
-              @stream.charsUntil(ASCII_LETTERS, true)
-        elsif data == ">"
-            emitCurrentToken
-        elsif data == "<"
-            @stream.queue.push(data)
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected < character when getting the tag name.")})
-            emitCurrentToken
-        elsif data == "/"
-            processSolidusInTag
-            @state = @states[:beforeAttributeName]
-        else
-            @currentToken[:name] += data
-        end
-        return true
+      data = @stream.char
+      if SPACE_CHARACTERS.include? data
+        @state = @states[:beforeAttributeName]
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file in the tag name.")})
+        emitCurrentToken
+      elsif ASCII_LETTERS.include? data
+        @currentToken[:name] += data +\
+          @stream.chars_until(ASCII_LETTERS, true)
+      elsif data == ">"
+        emitCurrentToken
+      elsif data == "<"
+        @stream.queue.push(data)
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected < character when getting the tag name.")})
+        emitCurrentToken
+      elsif data == "/"
+        processSolidusInTag
+        @state = @states[:beforeAttributeName]
+      else
+        @currentToken[:name] += data
+      end
+      return true
     end
 
     def beforeAttributeNameState
-        data = @stream.char
-        if SPACE_CHARACTERS.include? data
-            @stream.charsUntil(SPACE_CHARACTERS, true)
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file. Expected attribute name instead.")})
-            emitCurrentToken
-        elsif ASCII_LETTERS.include? data
-            @currentToken[:data].push([data, ""])
-            @state = @states[:attributeName]
-        elsif data == ">"
-            emitCurrentToken
-        elsif data == "/"
-            processSolidusInTag
-        elsif data == "<"
-            @stream.queue.push(data)
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected < character. Expected attribute name instead.")})
-            emitCurrentToken
-        else
-            @currentToken[:data].push([data, ""])
-            @state = @states[:attributeName]
-        end
-        return true
+      data = @stream.char
+      if SPACE_CHARACTERS.include? data
+        @stream.chars_until(SPACE_CHARACTERS, true)
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file. Expected attribute name instead.")})
+        emitCurrentToken
+      elsif ASCII_LETTERS.include? data
+        @currentToken[:data].push([data, ""])
+        @state = @states[:attributeName]
+      elsif data == ">"
+        emitCurrentToken
+      elsif data == "/"
+        processSolidusInTag
+      elsif data == "<"
+        @stream.queue.push(data)
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected < character. Expected attribute name instead.")})
+        emitCurrentToken
+      else
+        @currentToken[:data].push([data, ""])
+        @state = @states[:attributeName]
+      end
+      return true
     end
 
     def attributeNameState
-        data = @stream.char
-        leavingThisState = true
-        if data == "="
-            @state = @states[:beforeAttributeValue]
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file in attribute name.")})
-            emitCurrentToken
-            leavingThisState = false
-        elsif ASCII_LETTERS.include? data
-            @currentToken[:data][-1][0] += data +\
-              @stream.charsUntil(ASCII_LETTERS, true)
-            leavingThisState = false
-        elsif data == ">"
-            # XXX If we emit here the attributes are converted to a dict
-            # without being checked and when the code below runs we error
-            # because data is a dict not a list
-        elsif SPACE_CHARACTERS.include? data
-            @state = @states[:afterAttributeName]
-        elsif data == "/"
-            processSolidusInTag
-            @state = @states[:beforeAttributeName]
-        elsif data == "<"
-            @stream.queue.push(data)
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected < character in attribute name.")})
-            emitCurrentToken
-            leavingThisState = false
-        else
-            @currentToken[:data][-1][0] += data
-            leavingThisState = false
-        end
+      data = @stream.char
+      leavingThisState = true
+      if data == "="
+        @state = @states[:beforeAttributeValue]
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file in attribute name.")})
+        emitCurrentToken
+        leavingThisState = false
+      elsif ASCII_LETTERS.include? data
+        @currentToken[:data][-1][0] += data +\
+          @stream.chars_until(ASCII_LETTERS, true)
+        leavingThisState = false
+      elsif data == ">"
+        # XXX If we emit here the attributes are converted to a dict
+        # without being checked and when the code below runs we error
+        # because data is a dict not a list
+      elsif SPACE_CHARACTERS.include? data
+        @state = @states[:afterAttributeName]
+      elsif data == "/"
+        processSolidusInTag
+        @state = @states[:beforeAttributeName]
+      elsif data == "<"
+        @stream.queue.push(data)
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected < character in attribute name.")})
+        emitCurrentToken
+        leavingThisState = false
+      else
+        @currentToken[:data][-1][0] += data
+        leavingThisState = false
+      end
 
-        if leavingThisState
-            # Attributes are not dropped at this stage. That happens when the
-            # start tag token is emitted so values can still be safely appended
-            # to attributes, but we do want to report the parse error in time.
-            @currentToken[:data][0...-1].each {|name,value|
-                if @currentToken[:data][-1][0] == name
-                    @tokenQueue.push({:type => :ParseError, :data =>
-                      _("Dropped duplicate attribute on tag.")})
-                end
-            }
-            # XXX Fix for above XXX
-            if data == ">"
-                emitCurrentToken
-            end
+      if leavingThisState
+        # Attributes are not dropped at this stage. That happens when the
+        # start tag token is emitted so values can still be safely appended
+        # to attributes, but we do want to report the parse error in time.
+        @currentToken[:data][0...-1].each {|name,value|
+          if @currentToken[:data][-1][0] == name
+            @tokenQueue.push({:type => :ParseError, :data =>
+              _("Dropped duplicate attribute on tag.")})
+          end
+        }
+        # XXX Fix for above XXX
+        if data == ">"
+          emitCurrentToken
         end
-        return true
+      end
+      return true
     end
 
     def afterAttributeNameState
-        data = @stream.char
-        if SPACE_CHARACTERS.include? data
-            @stream.charsUntil(SPACE_CHARACTERS, true)
-        elsif data == "="
-            @state = @states[:beforeAttributeValue]
-        elsif data == ">"
-            emitCurrentToken
-        elsif ASCII_LETTERS.include? data
-            @currentToken[:data].push([data, ""])
-            @state = @states[:attributeName]
-        elsif data == "/"
-            processSolidusInTag
-            @state = @states[:beforeAttributeName]
-        elsif data == "<"
-            @stream.queue.push(data)
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected < character. Expected = or end of tag.")})
-            emitCurrentToken
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file. Expected = or end of tag.")})
-            emitCurrentToken
-        else
-            @currentToken[:data].push([data, ""])
-            @state = @states[:attributeName]
-        end
-        return true
+      data = @stream.char
+      if SPACE_CHARACTERS.include? data
+        @stream.chars_until(SPACE_CHARACTERS, true)
+      elsif data == "="
+        @state = @states[:beforeAttributeValue]
+      elsif data == ">"
+        emitCurrentToken
+      elsif ASCII_LETTERS.include? data
+        @currentToken[:data].push([data, ""])
+        @state = @states[:attributeName]
+      elsif data == "/"
+        processSolidusInTag
+        @state = @states[:beforeAttributeName]
+      elsif data == "<"
+        @stream.queue.push(data)
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected < character. Expected = or end of tag.")})
+        emitCurrentToken
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file. Expected = or end of tag.")})
+        emitCurrentToken
+      else
+        @currentToken[:data].push([data, ""])
+        @state = @states[:attributeName]
+      end
+      return true
     end
 
     def beforeAttributeValueState
-        data = @stream.char
-        if SPACE_CHARACTERS.include? data
-            @stream.charsUntil(SPACE_CHARACTERS, true)
-        elsif data == "\""
-            @state = @states[:attributeValueDoubleQuoted]
-        elsif data == "&"
-            @state = @states[:attributeValueUnQuoted]
-            @stream.queue.push(data);
-        elsif data == "'"
-            @state = @states[:attributeValueSingleQuoted]
-        elsif data == ">"
-            emitCurrentToken
-        elsif data == "<"
-            @stream.queue.push(data)
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected < character. Expected attribute value.")})
-            emitCurrentToken
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file. Expected attribute value.")})
-            emitCurrentToken
-        else
-            @currentToken[:data][-1][1] += data
-            @state = @states[:attributeValueUnQuoted]
-        end
-        return true
+      data = @stream.char
+      if SPACE_CHARACTERS.include? data
+        @stream.chars_until(SPACE_CHARACTERS, true)
+      elsif data == "\""
+        @state = @states[:attributeValueDoubleQuoted]
+      elsif data == "&"
+        @state = @states[:attributeValueUnQuoted]
+        @stream.queue.push(data);
+      elsif data == "'"
+        @state = @states[:attributeValueSingleQuoted]
+      elsif data == ">"
+        emitCurrentToken
+      elsif data == "<"
+        @stream.queue.push(data)
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected < character. Expected attribute value.")})
+        emitCurrentToken
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file. Expected attribute value.")})
+        emitCurrentToken
+      else
+        @currentToken[:data][-1][1] += data
+        @state = @states[:attributeValueUnQuoted]
+      end
+      return true
     end
 
     def attributeValueDoubleQuotedState
-        data = @stream.char
-        if data == "\""
-            @state = @states[:beforeAttributeName]
-        elsif data == "&"
-            processEntityInAttribute
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file in attribute value (\").")})
-            emitCurrentToken
-        else
-            @currentToken[:data][-1][1] += data +\
-              @stream.charsUntil(["\"", "&"])
-        end
-        return true
+      data = @stream.char
+      if data == "\""
+        @state = @states[:beforeAttributeName]
+      elsif data == "&"
+        processEntityInAttribute
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file in attribute value (\").")})
+        emitCurrentToken
+      else
+        @currentToken[:data][-1][1] += data +\
+          @stream.chars_until(["\"", "&"])
+      end
+      return true
     end
 
     def attributeValueSingleQuotedState
-        data = @stream.char
-        if data == "'"
-            @state = @states[:beforeAttributeName]
-        elsif data == "&"
-            processEntityInAttribute
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file in attribute value (').")})
-            emitCurrentToken
-        else
-            @currentToken[:data][-1][1] += data +\
-              @stream.charsUntil(["'", "&"])
-        end
-        return true
+      data = @stream.char
+      if data == "'"
+        @state = @states[:beforeAttributeName]
+      elsif data == "&"
+        processEntityInAttribute
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file in attribute value (').")})
+        emitCurrentToken
+      else
+        @currentToken[:data][-1][1] += data +\
+          @stream.chars_until(["'", "&"])
+      end
+      return true
     end
 
     def attributeValueUnQuotedState
-        data = @stream.char
-        if SPACE_CHARACTERS.include? data
-            @state = @states[:beforeAttributeName]
-        elsif data == "&"
-            processEntityInAttribute
-        elsif data == ">"
-            emitCurrentToken
-        elsif data == "<"
-            @stream.queue.push(data)
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected < character in attribute value.")})
-            emitCurrentToken
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file in attribute value.")})
-            emitCurrentToken
-        else
-            @currentToken[:data][-1][1] += data + 
-              @stream.charsUntil(["&", ">","<"] + SPACE_CHARACTERS)
-        end
-        return true
+      data = @stream.char
+      if SPACE_CHARACTERS.include? data
+        @state = @states[:beforeAttributeName]
+      elsif data == "&"
+        processEntityInAttribute
+      elsif data == ">"
+        emitCurrentToken
+      elsif data == "<"
+        @stream.queue.push(data)
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected < character in attribute value.")})
+        emitCurrentToken
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file in attribute value.")})
+        emitCurrentToken
+      else
+        @currentToken[:data][-1][1] += data + 
+          @stream.chars_until(["&", ">","<"] + SPACE_CHARACTERS)
+      end
+      return true
     end
 
     def bogusCommentState
-        # Make a new comment token and give it as value all the characters
-        # until the first > or :EOF (charsUntil checks for :EOF automatically)
-        # and emit it.
-        @tokenQueue.push(
-          {:type => :Comment, :data => @stream.charsUntil((">"))})
+      # Make a new comment token and give it as value all the characters
+      # until the first > or :EOF (chars_until checks for :EOF automatically)
+      # and emit it.
+      @tokenQueue.push(
+        {:type => :Comment, :data => @stream.chars_until((">"))})
 
-        # Eat the character directly after the bogus comment which is either a
-        # ">" or an :EOF.
-        @stream.char
-        @state = @states[:data]
-        return true
+      # Eat the character directly after the bogus comment which is either a
+      # ">" or an :EOF.
+      @stream.char
+      @state = @states[:data]
+      return true
     end
 
     def markupDeclarationOpenState
-        charStack = [@stream.char, @stream.char]
-        if charStack == ["-", "-"]
-            @currentToken = {:type => :Comment, :data => ""}
-            @state = @states[:comment]
+      charStack = [@stream.char, @stream.char]
+      if charStack == ["-", "-"]
+        @currentToken = {:type => :Comment, :data => ""}
+        @state = @states[:comment]
+      else
+        5.times { charStack.push(@stream.char) }
+        # Put in explicit :EOF check
+        if ((not charStack.include? :EOF) and
+          charStack.join("").upcase == "DOCTYPE")
+          @currentToken =\
+            {:type => :Doctype, :name => "", :data => true}
+          @state = @states[:doctype]
         else
-            5.times { charStack.push(@stream.char) }
-            # Put in explicit :EOF check
-            if ((not charStack.include? :EOF) and
-                charStack.join("").upcase == "DOCTYPE")
-                @currentToken =\
-                  {:type => :Doctype, :name => "", :data => true}
-                @state = @states[:doctype]
-            else
-                @tokenQueue.push({:type => :ParseError, :data =>
-                  _("Expected '--' or 'DOCTYPE'. Not found.")})
-                @stream.queue += charStack
-                @state = @states[:bogusComment]
-            end
+          @tokenQueue.push({:type => :ParseError, :data =>
+            _("Expected '--' or 'DOCTYPE'. Not found.")})
+          @stream.queue += charStack
+          @state = @states[:bogusComment]
         end
-        return true
+      end
+      return true
     end
 
     def commentState
-        data = @stream.char
-        if data == "-"
-            @state = @states[:commentDash]
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file in comment.")})
-            @tokenQueue.push(@currentToken)
-            @state = @states[:data]
-        else
-            @currentToken[:data] += data + @stream.charsUntil("-")
-        end
-        return true
+      data = @stream.char
+      if data == "-"
+        @state = @states[:commentDash]
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file in comment.")})
+        @tokenQueue.push(@currentToken)
+        @state = @states[:data]
+      else
+        @currentToken[:data] += data + @stream.chars_until("-")
+      end
+      return true
     end
 
     def commentDashState
-        data = @stream.char
-        if data == "-"
-            @state = @states[:commentEnd]
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file in comment (-)")})
-            @tokenQueue.push(@currentToken)
-            @state = @states[:data]
-        else
-            @currentToken[:data] += "-" + data +\
-              @stream.charsUntil("-")
-            # Consume the next character which is either a "-" or an :EOF as
-            # well so if there's a "-" directly after the "-" we go nicely to
-            # the "comment end state" without emitting a ParseError there.
-            @stream.char
-        end
-        return true
+      data = @stream.char
+      if data == "-"
+        @state = @states[:commentEnd]
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file in comment (-)")})
+        @tokenQueue.push(@currentToken)
+        @state = @states[:data]
+      else
+        @currentToken[:data] += "-" + data +\
+          @stream.chars_until("-")
+        # Consume the next character which is either a "-" or an :EOF as
+        # well so if there's a "-" directly after the "-" we go nicely to
+        # the "comment end state" without emitting a ParseError there.
+        @stream.char
+      end
+      return true
     end
 
     def commentEndState
-        data = @stream.char
-        if data == ">"
-            @tokenQueue.push(@currentToken)
-            @state = @states[:data]
-        elsif data == "-"
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected '-' after '--' found in comment.")})
-            @currentToken[:data] += data
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file in comment (--).")})
-            @tokenQueue.push(@currentToken)
-            @state = @states[:data]
-        else
-            # XXX
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected character in comment found.")})
-            @currentToken[:data] += "--" + data
-            @state = @states[:comment]
-        end
-        return true
+      data = @stream.char
+      if data == ">"
+        @tokenQueue.push(@currentToken)
+        @state = @states[:data]
+      elsif data == "-"
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected '-' after '--' found in comment.")})
+        @currentToken[:data] += data
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file in comment (--).")})
+        @tokenQueue.push(@currentToken)
+        @state = @states[:data]
+      else
+        # XXX
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected character in comment found.")})
+        @currentToken[:data] += "--" + data
+        @state = @states[:comment]
+      end
+      return true
     end
 
     def doctypeState
-        data = @stream.char
-        if SPACE_CHARACTERS.include? data
-            @state = @states[:beforeDoctypeName]
-        else
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("No space after literal string 'DOCTYPE'.")})
-            @stream.queue.push(data)
-            @state = @states[:beforeDoctypeName]
-        end
-        return true
+      data = @stream.char
+      if SPACE_CHARACTERS.include? data
+        @state = @states[:beforeDoctypeName]
+      else
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("No space after literal string 'DOCTYPE'.")})
+        @stream.queue.push(data)
+        @state = @states[:beforeDoctypeName]
+      end
+      return true
     end
 
     def beforeDoctypeNameState
-        data = @stream.char
-        if SPACE_CHARACTERS.include? data
-        elsif ASCII_LOWERCASE.include? data
-            @currentToken[:name] = data.upcase
-            @state = @states[:doctypeName]
-        elsif data == ">"
-            # Character needs to be consumed per the specification so don't
-            # invoke emitCurrentTokenWithParseError with :data as argument.
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected > character. Expected DOCTYPE name.")})
-            @tokenQueue.push(@currentToken)
-            @state = @states[:data]
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file. Expected DOCTYPE name.")})
-            @tokenQueue.push(@currentToken)
-            @state = @states[:data]
-        else
-            @currentToken[:name] = data
-            @state = @states[:doctypeName]
-        end
-        return true
+      data = @stream.char
+      if SPACE_CHARACTERS.include? data
+      elsif ASCII_LOWERCASE.include? data
+        @currentToken[:name] = data.upcase
+        @state = @states[:doctypeName]
+      elsif data == ">"
+        # Character needs to be consumed per the specification so don't
+        # invoke emitCurrentTokenWithParseError with :data as argument.
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected > character. Expected DOCTYPE name.")})
+        @tokenQueue.push(@currentToken)
+        @state = @states[:data]
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file. Expected DOCTYPE name.")})
+        @tokenQueue.push(@currentToken)
+        @state = @states[:data]
+      else
+        @currentToken[:name] = data
+        @state = @states[:doctypeName]
+      end
+      return true
     end
 
     def doctypeNameState
-        data = @stream.char
-        needsDoctypeCheck = false
-        if SPACE_CHARACTERS.include? data
-            @state = @states[:afterDoctypeName]
-            needsDoctypeCheck = true
-        elsif data == ">"
-            @tokenQueue.push(@currentToken)
-            @state = @states[:data]
-        elsif data == :EOF
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file in DOCTYPE name.")})
-            @tokenQueue.push(@currentToken)
-            @state = @states[:data]
-        else
-            # We can't just uppercase everything that arrives here. For
-            # instance, non-ASCII characters.
-            if ASCII_LOWERCASE.include? data
-                data = data.upcase
-            end
-            @currentToken[:name] += data
-            needsDoctypeCheck = true
+      data = @stream.char
+      needsDoctypeCheck = false
+      if SPACE_CHARACTERS.include? data
+        @state = @states[:afterDoctypeName]
+        needsDoctypeCheck = true
+      elsif data == ">"
+        @tokenQueue.push(@currentToken)
+        @state = @states[:data]
+      elsif data == :EOF
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file in DOCTYPE name.")})
+        @tokenQueue.push(@currentToken)
+        @state = @states[:data]
+      else
+        # We can't just uppercase everything that arrives here. For
+        # instance, non-ASCII characters.
+        if ASCII_LOWERCASE.include? data
+          data = data.upcase
         end
+        @currentToken[:name] += data
+        needsDoctypeCheck = true
+      end
 
-        # After some iterations through this state it should eventually say
-        # "HTML". Otherwise there's an error.
-        if needsDoctypeCheck and @currentToken[:name] == "HTML"
-            @currentToken[:data] = false
-        end
-        return true
+      # After some iterations through this state it should eventually say
+      # "HTML". Otherwise there's an error.
+      if needsDoctypeCheck and @currentToken[:name] == "HTML"
+        @currentToken[:data] = false
+      end
+      return true
     end
 
     def afterDoctypeNameState
-        data = @stream.char
-        if SPACE_CHARACTERS.include? data
-        elsif data == ">"
-            @tokenQueue.push(@currentToken)
-            @state = @states[:data]
-        elsif data == :EOF
-            @currentToken[:data] = true
-            # XXX EMIT
-            @stream.queue.push(data)
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file in DOCTYPE.")})
-            @tokenQueue.push(@currentToken)
-            @state = @states[:data]
-        else
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Expected space or '>'. Got '" + data + "'")})
-            @currentToken[:data] = true
-            @state = @states[:bogusDoctype]
-        end
-        return true
+      data = @stream.char
+      if SPACE_CHARACTERS.include? data
+      elsif data == ">"
+        @tokenQueue.push(@currentToken)
+        @state = @states[:data]
+      elsif data == :EOF
+        @currentToken[:data] = true
+        # XXX EMIT
+        @stream.queue.push(data)
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file in DOCTYPE.")})
+        @tokenQueue.push(@currentToken)
+        @state = @states[:data]
+      else
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Expected space or '>'. Got '" + data + "'")})
+        @currentToken[:data] = true
+        @state = @states[:bogusDoctype]
+      end
+      return true
     end
 
     def bogusDoctypeState
-        data = @stream.char
-        if data == ">"
-            @tokenQueue.push(@currentToken)
-            @state = @states[:data]
-        elsif data == :EOF
-            # XXX EMIT
-            @stream.queue.push(data)
-            @tokenQueue.push({:type => :ParseError, :data =>
-              _("Unexpected end of file in bogus doctype.")})
-            @tokenQueue.push(@currentToken)
-            @state = @states[:data]
-        end
-        return true
+      data = @stream.char
+      if data == ">"
+        @tokenQueue.push(@currentToken)
+        @state = @states[:data]
+      elsif data == :EOF
+        # XXX EMIT
+        @stream.queue.push(data)
+        @tokenQueue.push({:type => :ParseError, :data =>
+          _("Unexpected end of file in bogus doctype.")})
+        @tokenQueue.push(@currentToken)
+        @state = @states[:data]
+      end
+      return true
     end
 
     def _(string); string; end
-end
+  end
 
 end
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/treebuilders.rb b/vendor/plugins/HTML5lib/lib/html5lib/treebuilders.rb
index 838ddc71..176b402a 100644
--- a/vendor/plugins/HTML5lib/lib/html5lib/treebuilders.rb
+++ b/vendor/plugins/HTML5lib/lib/html5lib/treebuilders.rb
@@ -1,21 +1,21 @@
 module HTML5lib
-module TreeBuilders
+  module TreeBuilders
 
-  def self.getTreeBuilder(name)
-    case name.to_s.downcase
+    def self.getTreeBuilder(name)
+      case name.to_s.downcase
         when 'simpletree' then
-            require 'html5lib/treebuilders/simpletree'
-            SimpleTree::TreeBuilder
+          require 'html5lib/treebuilders/simpletree'
+          SimpleTree::TreeBuilder
         when 'rexml' then
-            require 'html5lib/treebuilders/rexml'
-            REXMLTree::TreeBuilder
+          require 'html5lib/treebuilders/rexml'
+          REXMLTree::TreeBuilder
         when 'hpricot' then
-            require 'html5lib/treebuilders/hpricot'
-            Hpricot::TreeBuilder
+          require 'html5lib/treebuilders/hpricot'
+          Hpricot::TreeBuilder
         else
-            raise "Unknown TreeBuilder #{name}"
+          raise "Unknown TreeBuilder #{name}"
+      end
     end
-  end
 
-end
+  end
 end
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/base.rb b/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/base.rb
index 3f1f914f..5c1be892 100755
--- a/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/base.rb
+++ b/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/base.rb
@@ -4,166 +4,166 @@ require 'html5lib/constants'
 
 module HTML5lib
 
-# The scope markers are inserted when entering buttons, object elements,
-# marquees, table cells, and table captions, and are used to prevent formatting
-# from "leaking" into tables, buttons, object elements, and marquees.
-Marker = nil
+  # The scope markers are inserted when entering buttons, object elements,
+  # marquees, table cells, and table captions, and are used to prevent formatting
+  # from "leaking" into tables, buttons, object elements, and marquees.
+  Marker = nil
 
-module TreeBuilders
-module Base
+  module TreeBuilders
+    module Base
 
-class Node
-    # The parent of the current node (or nil for the document node)
-    attr_accessor :parent
+      class Node
+        # The parent of the current node (or nil for the document node)
+        attr_accessor :parent
 
-    # a list of child nodes of the current node. This must 
-    # include all elements but not necessarily other node types
-    attr_accessor :childNodes
+        # a list of child nodes of the current node. This must 
+        # include all elements but not necessarily other node types
+        attr_accessor :childNodes
 
-    # A list of miscellaneous flags that can be set on the node
-    attr_accessor :_flags
+        # A list of miscellaneous flags that can be set on the node
+        attr_accessor :_flags
 
-    def initialize(name)
-        @parent = nil
-        @childNodes = []
-        @_flags = []
-    end
-
-    # Insert node as a child of the current node
-    def appendChild(node)
-        raise NotImplementedError
-    end
-
-    # Insert data as text in the current node, positioned before the 
-    # start of node insertBefore or to the end of the node's text.
-    def insertText(data, insertBefore = nil)
-        raise NotImplementedError
-    end
-
-    # Insert node as a child of the current node, before refNode in the 
-    # list of child nodes. Raises ValueError if refNode is not a child of 
-    # the current node
-    def insertBefore(node, refNode)
-        raise NotImplementedError
-    end
-
-    # Remove node from the children of the current node
-    def removeChild(node)
-        raise NotImplementedError
-    end
-
-    # Move all the children of the current node to newParent. 
-    # This is needed so that trees that don't store text as nodes move the 
-    # text in the correct way
-    def reparentChildren(newParent)
-        #XXX - should this method be made more general?
-        @childNodes.each { |child| newParent.appendChild(child) }
-        @childNodes = []
-    end
-
-    # Return a shallow copy of the current node i.e. a node with the same
-    # name and attributes but with no parent or child nodes
-    def cloneNode
-        raise NotImplementedError
-    end
-
-    # Return true if the node has children or text, false otherwise
-    def hasContent
-        raise NotImplementedError
-    end
-end
-
-# Base treebuilder implementation
-class TreeBuilder
-
-    attr_accessor :openElements
-
-    attr_accessor :activeFormattingElements
-
-    attr_accessor :document
-
-    attr_accessor :headPointer
-
-    attr_accessor :formPointer
-
-    # Class to use for document root
-    documentClass = nil
-
-    # Class to use for HTML elements
-    elementClass = nil
-
-    # Class to use for comments
-    commentClass = nil
-
-    # Class to use for doctypes
-    doctypeClass = nil
-    
-    # Fragment class
-    fragmentClass = nil
-
-    def initialize
-        reset
-    end
-    
-    def reset
-        @openElements = []
-        @activeFormattingElements = []
-
-        #XXX - rename these to headElement, formElement
-        @headPointer = nil
-        @formPointer = nil
-
-        self.insertFromTable = false
-
-        @document = @documentClass.new
-    end
-
-    def elementInScope(target, tableVariant = false)
-        # Exit early when possible.
-        return true if @openElements[-1].name == target
-
-        # AT How about while true and simply set node to [-1] and set it to
-        # [-2] at the end...
-        @openElements.reverse.each do |element|
-            if element.name == target
-                return true
-            elsif element.name == 'table'
-                return false
-            elsif not tableVariant and SCOPING_ELEMENTS.include?(element.name)
-                return false
-            elsif element.name == 'html'
-                return false
-            end
+        def initialize(name)
+          @parent = nil
+          @childNodes = []
+          @_flags = []
         end
-        assert false # We should never reach this point
-    end
 
-    def reconstructActiveFormattingElements
-        # Within this algorithm the order of steps described in the
-        # specification is not quite the same as the order of steps in the
-        # code. It should still do the same though.
+        # Insert node as a child of the current node
+        def appendChild(node)
+          raise NotImplementedError
+        end
 
-        # Step 1: stop the algorithm when there's nothing to do.
-        return unless @activeFormattingElements
+        # Insert data as text in the current node, positioned before the 
+        # start of node insertBefore or to the end of the node's text.
+        def insertText(data, insertBefore=nil)
+          raise NotImplementedError
+        end
 
-        # Step 2 and step 3: we start with the last element. So i is -1.
-        i = -1
-        entry = @activeFormattingElements[i]
-        return if entry == Marker or @openElements.include?(entry)
+        # Insert node as a child of the current node, before refNode in the 
+        # list of child nodes. Raises ValueError if refNode is not a child of 
+        # the current node
+        def insertBefore(node, refNode)
+          raise NotImplementedError
+        end
 
-        # Step 6
-        until entry == Marker or @openElements.include?(entry)
+        # Remove node from the children of the current node
+        def removeChild(node)
+          raise NotImplementedError
+        end
+
+        # Move all the children of the current node to newParent. 
+        # This is needed so that trees that don't store text as nodes move the 
+        # text in the correct way
+        def reparentChildren(newParent)
+          #XXX - should this method be made more general?
+          @childNodes.each { |child| newParent.appendChild(child) }
+          @childNodes = []
+        end
+
+        # Return a shallow copy of the current node i.e. a node with the same
+        # name and attributes but with no parent or child nodes
+        def cloneNode
+          raise NotImplementedError
+        end
+
+        # Return true if the node has children or text, false otherwise
+        def hasContent
+          raise NotImplementedError
+        end
+      end
+
+      # Base treebuilder implementation
+      class TreeBuilder
+
+        attr_accessor :openElements
+
+        attr_accessor :activeFormattingElements
+
+        attr_accessor :document
+
+        attr_accessor :headPointer
+
+        attr_accessor :formPointer
+
+        # Class to use for document root
+        documentClass = nil
+
+        # Class to use for HTML elements
+        elementClass = nil
+
+        # Class to use for comments
+        commentClass = nil
+
+        # Class to use for doctypes
+        doctypeClass = nil
+
+        # Fragment class
+        fragmentClass = nil
+
+        def initialize
+          reset
+        end
+
+        def reset
+          @openElements = []
+          @activeFormattingElements = []
+
+          #XXX - rename these to headElement, formElement
+          @headPointer = nil
+          @formPointer = nil
+
+          self.insertFromTable = false
+
+          @document = @documentClass.new
+        end
+
+        def elementInScope(target, tableVariant=false)
+          # Exit early when possible.
+          return true if @openElements[-1].name == target
+
+          # AT How about while true and simply set node to [-1] and set it to
+          # [-2] at the end...
+          @openElements.reverse.each do |element|
+            if element.name == target
+              return true
+            elsif element.name == 'table'
+              return false
+            elsif not tableVariant and SCOPING_ELEMENTS.include?(element.name)
+              return false
+            elsif element.name == 'html'
+              return false
+            end
+          end
+          assert false # We should never reach this point
+        end
+
+        def reconstructActiveFormattingElements
+          # Within this algorithm the order of steps described in the
+          # specification is not quite the same as the order of steps in the
+          # code. It should still do the same though.
+
+          # Step 1: stop the algorithm when there's nothing to do.
+          return unless @activeFormattingElements
+
+          # Step 2 and step 3: we start with the last element. So i is -1.
+          i = -1
+          entry = @activeFormattingElements[i]
+          return if entry == Marker or @openElements.include?(entry)
+
+          # Step 6
+          until entry == Marker or @openElements.include?(entry)
             # Step 5: let entry be one earlier in the list.
             i -= 1
             begin
-                entry = @activeFormattingElements[i]
+              entry = @activeFormattingElements[i]
             rescue
-                # Step 4: at this point we need to jump to step 8. By not doing
-                # i += 1 which is also done in step 7 we achieve that.
-                break
+              # Step 4: at this point we need to jump to step 8. By not doing
+              # i += 1 which is also done in step 7 we achieve that.
+              break
             end
-        end
-        while true
+          end
+          while true
             # Step 7
             i += 1
 
@@ -178,153 +178,153 @@ class TreeBuilder
 
             # Step 11
             break if element == @activeFormattingElements[-1]
+          end
         end
-    end
 
-    def clearActiveFormattingElements
-        {} until @activeFormattingElements.empty? || @activeFormattingElements.pop == Marker
-    end
+        def clearActiveFormattingElements
+          {} until @activeFormattingElements.empty? || @activeFormattingElements.pop == Marker
+        end
 
-    # Check if an element exists between the end of the active
-    # formatting elements and the last marker. If it does, return it, else
-    # return false
-    def elementInActiveFormattingElements(name)
-        @activeFormattingElements.reverse.each do |element|
+        # Check if an element exists between the end of the active
+        # formatting elements and the last marker. If it does, return it, else
+        # return false
+        def elementInActiveFormattingElements(name)
+          @activeFormattingElements.reverse.each do |element|
             # Check for Marker first because if it's a Marker it doesn't have a
             # name attribute.
             break if element == Marker
             return element if element.name == name
+          end
+          return false
         end
-        return false
-    end
 
-    def insertDoctype(name)
-        @document.appendChild(@doctypeClass.new(name))
-    end
+        def insertDoctype(name)
+          @document.appendChild(@doctypeClass.new(name))
+        end
 
-    def insertComment(data, parent = nil)
-        parent = @openElements[-1] if parent.nil?
-        parent.appendChild(@commentClass.new(data))
-    end
-                           
-    # Create an element but don't insert it anywhere
-    def createElement(name, attributes)
-        element = @elementClass.new(name)
-        element.attributes = attributes
-        return element
-    end
+        def insertComment(data, parent=nil)
+          parent = @openElements[-1] if parent.nil?
+          parent.appendChild(@commentClass.new(data))
+        end
+               
+        # Create an element but don't insert it anywhere
+        def createElement(name, attributes)
+          element = @elementClass.new(name)
+          element.attributes = attributes
+          return element
+        end
 
-    # Switch the function used to insert an element from the
-    # normal one to the misnested table one and back again
-    def insertFromTable=(value)
-        @insertFromTable = value
-        @insertElement = value ? :insertElementTable : :insertElementNormal
-    end
+        # Switch the function used to insert an element from the
+        # normal one to the misnested table one and back again
+        def insertFromTable=(value)
+          @insertFromTable = value
+          @insertElement = value ? :insertElementTable : :insertElementNormal
+        end
 
-    def insertElement(name, attributes)
-        send(@insertElement, name, attributes)
-    end
+        def insertElement(name, attributes)
+          send(@insertElement, name, attributes)
+        end
 
-    def insertElementNormal(name, attributes)
-        element = @elementClass.new(name)
-        element.attributes = attributes
-        @openElements[-1].appendChild(element)
-        @openElements.push(element)
-        return element
-    end
+        def insertElementNormal(name, attributes)
+          element = @elementClass.new(name)
+          element.attributes = attributes
+          @openElements[-1].appendChild(element)
+          @openElements.push(element)
+          return element
+        end
 
-    # Create an element and insert it into the tree
-    def insertElementTable(name, attributes)
-        element = @elementClass.new(name)
-        element.attributes = attributes
-        if TABLE_INSERT_MODE_ELEMENTS.include?(@openElements[-1].name)
+        # Create an element and insert it into the tree
+        def insertElementTable(name, attributes)
+          element = @elementClass.new(name)
+          element.attributes = attributes
+          if TABLE_INSERT_MODE_ELEMENTS.include?(@openElements[-1].name)
             #We should be in the InTable mode. This means we want to do
             #special magic element rearranging
             parent, insertBefore = getTableMisnestedNodePosition
             if insertBefore.nil?
-                parent.appendChild(element)
+              parent.appendChild(element)
             else
-                parent.insertBefore(element, insertBefore)
+              parent.insertBefore(element, insertBefore)
             end
             @openElements.push(element)
-        else
+          else
             return insertElementNormal(name, attributes)
+          end
+          return element
         end
-        return element
-    end
 
-    def insertText(data, parent = nil)
-        parent = @openElements[-1] if parent.nil?
+        def insertText(data, parent=nil)
+          parent = @openElements[-1] if parent.nil?
 
-        if (not(@insertFromTable) or (@insertFromTable and not TABLE_INSERT_MODE_ELEMENTS.include?(@openElements[-1].name)))
+          if (not(@insertFromTable) or (@insertFromTable and not TABLE_INSERT_MODE_ELEMENTS.include?(@openElements[-1].name)))
             parent.insertText(data)
-        else
+          else
             #We should be in the InTable mode. This means we want to do
             #special magic element rearranging
             parent, insertBefore = getTableMisnestedNodePosition
             parent.insertText(data, insertBefore)
+          end
         end
-    end
-            
-    # Get the foster parent element, and sibling to insert before
-    # (or nil) when inserting a misnested table node
-    def getTableMisnestedNodePosition
-        #The foster parent element is the one which comes before the most
-        #recently opened table element
-        #XXX - this is really inelegant
-        lastTable = nil
-        fosterParent = nil
-        insertBefore = nil
-        @openElements.reverse.each do |element|
+      
+        # Get the foster parent element, and sibling to insert before
+        # (or nil) when inserting a misnested table node
+        def getTableMisnestedNodePosition
+          #The foster parent element is the one which comes before the most
+          #recently opened table element
+          #XXX - this is really inelegant
+          lastTable = nil
+          fosterParent = nil
+          insertBefore = nil
+          @openElements.reverse.each do |element|
             if element.name == "table"
-                lastTable = element
-                break
+              lastTable = element
+              break
             end
-        end
-        if lastTable
+          end
+          if lastTable
             #XXX - we should really check that this parent is actually a
             #node here
             if lastTable.parent
-                fosterParent = lastTable.parent
-                insertBefore = lastTable
+              fosterParent = lastTable.parent
+              insertBefore = lastTable
             else
-                fosterParent = @openElements[@openElements.index(lastTable) - 1]
+              fosterParent = @openElements[@openElements.index(lastTable) - 1]
             end
-        else
+          else
             fosterParent = @openElements[0]
+          end
+          return fosterParent, insertBefore
         end
-        return fosterParent, insertBefore
-    end
 
-    def generateImpliedEndTags(exclude = nil)
-        name = @openElements[-1].name
+        def generateImpliedEndTags(exclude=nil)
+          name = @openElements[-1].name
 
-        if (['dd', 'dt', 'li', 'p', 'td', 'th', 'tr'].include?(name) and name != exclude)
+          if (['dd', 'dt', 'li', 'p', 'td', 'th', 'tr'].include?(name) and name != exclude)
             @openElements.pop
             # XXX This is not entirely what the specification says. We should
             # investigate it more closely.
             generateImpliedEndTags(exclude)
+          end
         end
-    end
 
-    def getDocument
-        @document
-    end
-    
-    def getFragment
-        #assert @innerHTML
-        fragment = @fragmentClass.new
-        @openElements[0].reparentChildren(fragment)
-        return fragment
-    end
+        def getDocument
+          @document
+        end
+  
+        def getFragment
+          #assert @innerHTML
+          fragment = @fragmentClass.new
+          @openElements[0].reparentChildren(fragment)
+          return fragment
+        end
 
-    # Serialize the subtree of node in the format required by unit tests
-    # node - the node from which to start serializing
-    def testSerializer(node)
-        raise NotImplementedError
-    end
+        # Serialize the subtree of node in the format required by unit tests
+        # node - the node from which to start serializing
+        def testSerializer(node)
+          raise NotImplementedError
+        end
 
-end
-end
-end
+      end
+    end
+  end
 end
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/hpricot.rb b/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/hpricot.rb
index f3cba33b..3ea8afa2 100644
--- a/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/hpricot.rb
+++ b/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/hpricot.rb
@@ -3,209 +3,212 @@ require 'hpricot'
 require 'forwardable'
 
 module HTML5lib
-module TreeBuilders
-module Hpricot
+  module TreeBuilders
+    module Hpricot
 
-class Node < Base::Node
+      class Node < Base::Node
 
-    extend Forwardable
+        extend Forwardable
 
-    def_delegators :@hpricot, :name
+        def_delegators :@hpricot, :name
 
-    attr_accessor :hpricot
+        attr_accessor :hpricot
 
-    def initialize(name)
-        super(name)
-        @hpricot = self.class.hpricot_class.new name
-    end
+        def initialize(name)
+          super(name)
+          @hpricot = self.class.hpricot_class.new name
+        end
 
-    def appendChild(node)
-        if node.kind_of?(TextNode) and childNodes.any? and childNodes.last.kind_of?(TextNode)
+        def appendChild(node)
+          if node.kind_of?(TextNode) and childNodes.any? and childNodes.last.kind_of?(TextNode)
             childNodes[-1].hpricot.content = childNodes[-1].hpricot.to_s + node.hpricot.to_s
-        else
+          else
             childNodes << node
             hpricot.children << node.hpricot
+          end
+          node.parent = self
         end
-        node.parent = self
-    end
 
-    def removeChild(node)
-       childNodes.delete(node)
-       hpricot.children.delete_at(hpricot.children.index(node.hpricot))
-       node.parent = nil
-    end
+        def removeChild(node)
+           childNodes.delete(node)
+           hpricot.children.delete_at(hpricot.children.index(node.hpricot))
+           node.parent = nil
+        end
 
-    def insertText(data, before = nil)
-        if before
+        def insertText(data, before=nil)
+          if before
             insertBefore(TextNode.new(data), before)
-        else
+          else
             appendChild(TextNode.new(data))
+          end
         end
-    end
 
-    def insertBefore(node, refNode)
-        index = childNodes.index(refNode)
-        if node.kind_of?(TextNode) and index > 0 and childNodes[index-1].kind_of?(TextNode)
+        def insertBefore(node, refNode)
+          index = childNodes.index(refNode)
+          if node.kind_of?(TextNode) and index > 0 and childNodes[index-1].kind_of?(TextNode)
             childNodes[index-1].hpricot.content = childNodes[index-1].hpricot.to_s + node.hpricot.to_s
-        else
+          else
             childNodes.insert(index, node)
+          end
         end
-    end
 
-    def hasContent
-        childNodes.any?
-    end
-end
+        def hasContent
+          childNodes.any?
+        end
+      end
 
-class Element < Node
-    def self.hpricot_class
-        ::Hpricot::Elem
-    end
+      class Element < Node
+        def self.hpricot_class
+          ::Hpricot::Elem
+        end
 
-    def initialize(name)
-        super(name)
+        def initialize(name)
+          super(name)
 
-        @hpricot = ::Hpricot::Elem.new(::Hpricot::STag.new(name))
-    end
+          @hpricot = ::Hpricot::Elem.new(::Hpricot::STag.new(name))
+        end
 
-    def name
-        @hpricot.stag.name
-    end
+        def name
+          @hpricot.stag.name
+        end
 
-    def cloneNode
-        attributes.inject(self.class.new(name)) do |node, (name, value)|
+        def cloneNode
+          attributes.inject(self.class.new(name)) do |node, (name, value)|
             node.hpricot[name] = value
             node
+          end
         end
-    end
 
-    # A call to Hpricot::Elem#raw_attributes is built dynamically,
-    # so alterations to the returned value (a hash) will be lost.
-    #
-    # AttributeProxy works around this by forwarding :[]= calls
-    # to the raw_attributes accessor on the element start tag.
-    #
-    class AttributeProxy
-        def initialize(hpricot)
+        # The value returned by Hpricot::Elem#raw_attributes (a hash) is built
+        # dynamically, so alterations to that returned value will be lost.
+        #
+        # AttributeProxy works around this by forwarding :[]= calls
+        # to the raw_attributes accessor on the element start tag.
+        #
+        class AttributeProxy
+          def initialize(hpricot)
             @hpricot = hpricot
-        end
-        def []=(k, v)
+          end
+
+          def []=(k, v)
             @hpricot.stag.send(stag_attributes_method)[k] = v
-        end
-        def stag_attributes_method
+          end
+
+          def stag_attributes_method
             # STag#attributes changed to STag#raw_attributes after Hpricot 0.5
             @hpricot.stag.respond_to?(:raw_attributes) ? :raw_attributes : :attributes
-        end
-        def method_missing(*a, &b)
+          end
+
+          def method_missing(*a, &b)
             @hpricot.attributes.send(*a, &b)
+          end
         end
-    end
 
-    def attributes
-        AttributeProxy.new(@hpricot)
-    end
+        def attributes
+          AttributeProxy.new(@hpricot)
+        end
 
-    def attributes=(attrs)
-        attrs.each { |name, value| @hpricot[name] = value }
-    end
+        def attributes=(attrs)
+          attrs.each { |name, value| @hpricot[name] = value }
+        end
 
-    def printTree(indent = 0)
-        tree = "\n|#{' ' * indent}<#{name}>"
-        indent += 2
-        attributes.each do |name, value|
+        def printTree(indent=0)
+          tree = "\n|#{' ' * indent}<#{name}>"
+          indent += 2
+          attributes.each do |name, value|
             next if name == 'xmlns'
             tree += "\n|#{' ' * indent}#{name}=\"#{value}\""
+          end
+          childNodes.inject(tree) { |tree, child| tree + child.printTree(indent) }
         end
-        childNodes.inject(tree) { |tree, child| tree + child.printTree(indent) }
-    end
-end
+      end
 
-class Document < Node
-    def self.hpricot_class
-        ::Hpricot::Doc
-    end
+      class Document < Node
+        def self.hpricot_class
+          ::Hpricot::Doc
+        end
 
-    def initialize
-        super(nil)
-    end
+        def initialize
+          super(nil)
+        end
 
-    def printTree(indent = 0)
-        childNodes.inject('#document') { |tree, child| tree + child.printTree(indent + 2) }
-    end
-end
+        def printTree(indent=0)
+          childNodes.inject('#document') { |tree, child| tree + child.printTree(indent + 2) }
+        end
+      end
 
-class DocumentType < Node
-    def self.hpricot_class
-        ::Hpricot::DocType
-    end
+      class DocumentType < Node
+        def self.hpricot_class
+          ::Hpricot::DocType
+        end
 
-    def initialize(name)
-        begin
+        def initialize(name)
+          begin
             super(name)
-        rescue ArgumentError # needs 3...
+          rescue ArgumentError # needs 3...
+          end
+
+          @hpricot = ::Hpricot::DocType.new(name, nil, nil)
         end
 
-        @hpricot = ::Hpricot::DocType.new(name, nil, nil)
-    end
+        def printTree(indent=0)
+          "\n|#{' ' * indent}<!DOCTYPE #{hpricot.target}>"
+        end
+      end
+
+      class DocumentFragment < Element
+        def initialize
+          super('')
+        end
+
+        def printTree(indent=0)
+          childNodes.inject('') { |tree, child| tree + child.printTree(indent+2) }
+        end
+      end
+
+      class TextNode < Node
+        def initialize(data)
+          @hpricot = ::Hpricot::Text.new(data)
+        end
+
+        def printTree(indent=0)
+          "\n|#{' ' * indent}\"#{hpricot.content}\""
+        end
+      end
+
+      class CommentNode < Node
+        def self.hpricot_class
+          ::Hpricot::Comment
+        end
+
+        def printTree(indent=0)
+          "\n|#{' ' * indent}<!-- #{hpricot.content} -->"
+        end
+      end
+
+      class TreeBuilder < Base::TreeBuilder
+        def initialize
+          @documentClass = Document
+          @doctypeClass = DocumentType
+          @elementClass = Element
+          @commentClass = CommentNode
+          @fragmentClass = DocumentFragment
+        end
+
+        def testSerializer(node)
+          node.printTree
+        end
+
+        def getDocument
+          @document.hpricot
+        end
+
+        def getFragment
+          @document = super
+          return @document.hpricot.children
+        end
+      end
 
-    def printTree(indent = 0)
-        "\n|#{' ' * indent}<!DOCTYPE #{hpricot.target}>"
     end
-end
-
-class DocumentFragment < Element
-    def initialize
-        super('')
-    end
-
-    def printTree(indent = 0)
-        childNodes.inject('') { |tree, child| tree + child.printTree(indent+2) }
-    end
-end
-
-class TextNode < Node
-    def initialize(data)
-        @hpricot = ::Hpricot::Text.new(data)
-    end
-
-    def printTree(indent = 0)
-        "\n|#{' ' * indent}\"#{hpricot.content}\""
-    end
-end
-
-class CommentNode < Node
-    def self.hpricot_class
-        ::Hpricot::Comment
-    end
-
-    def printTree(indent = 0)
-        "\n|#{' ' * indent}<!-- #{hpricot.content} -->"
-    end
-end
-
-class TreeBuilder < Base::TreeBuilder
-    def initialize
-        @documentClass = Document
-        @doctypeClass = DocumentType
-        @elementClass = Element
-        @commentClass = CommentNode
-        @fragmentClass = DocumentFragment
-    end
-
-    def testSerializer(node)
-        node.printTree
-    end
-
-    def getDocument
-        @document.hpricot
-    end
-
-    def getFragment
-        @document = super
-        return @document.hpricot.children
-    end
-end
-
-end
-end
+  end
 end
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/rexml.rb b/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/rexml.rb
index 66886545..7c389ca6 100644
--- a/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/rexml.rb
+++ b/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/rexml.rb
@@ -3,189 +3,189 @@ require 'rexml/document'
 require 'forwardable'
 
 module HTML5lib
-module TreeBuilders
-module REXMLTree
+  module TreeBuilders
+    module REXMLTree
 
-class Node < Base::Node
-    extend Forwardable
-    def_delegators :@rxobj, :name, :attributes
-    attr_accessor :rxobj
+      class Node < Base::Node
+        extend Forwardable
+        def_delegators :@rxobj, :name, :attributes
+        attr_accessor :rxobj
 
-    def initialize name
-        super name
-        @rxobj = self.class.rxclass.new name
-    end
+        def initialize name
+          super name
+          @rxobj = self.class.rxclass.new name
+        end
 
-    def appendChild node
-        if node.kind_of? TextNode and 
-          childNodes.length>0 and childNodes[-1].kind_of? TextNode
+        def appendChild node
+          if node.kind_of? TextNode and 
+            childNodes.length>0 and childNodes[-1].kind_of? TextNode
             childNodes[-1].rxobj.value =
               childNodes[-1].rxobj.to_s + node.rxobj.to_s
             childNodes[-1].rxobj.raw = true
-        else
+          else
             childNodes.push node
             rxobj.add node.rxobj
+          end
+          node.parent = self
         end
-        node.parent = self
-    end
 
-    def removeChild node
-       childNodes.delete node
-       rxobj.delete node.rxobj
-       node.parent = nil
-    end
+        def removeChild node
+           childNodes.delete node
+           rxobj.delete node.rxobj
+           node.parent = nil
+        end
 
-    def insertText data, before=nil
-        if before
+        def insertText data, before=nil
+          if before
             insertBefore TextNode.new(data), before
-        else
+          else
             appendChild TextNode.new(data)
+          end
         end
-    end
 
-    def insertBefore node, refNode
-        index = childNodes.index(refNode)
-        if node.kind_of? TextNode and index>0 and 
-          childNodes[index-1].kind_of? TextNode
+        def insertBefore node, refNode
+          index = childNodes.index(refNode)
+          if node.kind_of? TextNode and index>0 and 
+            childNodes[index-1].kind_of? TextNode
             childNodes[index-1].rxobj.value =
               childNodes[index-1].rxobj.to_s + node.rxobj.to_s
             childNodes[index-1].rxobj.raw = true
-        else
+          else
             childNodes.insert index, node
+          end
         end
-    end
 
-    def hasContent
-        return (childNodes.length > 0)
-    end
-end
+        def hasContent
+          return (childNodes.length > 0)
+        end
+      end
 
-class Element < Node
-    def self.rxclass
-        REXML::Element
-    end
+      class Element < Node
+        def self.rxclass
+          REXML::Element
+        end
 
-    def initialize name
-        super name
-    end
+        def initialize name
+          super name
+        end
 
-    def cloneNode
-        newNode = self.class.new name
-        attributes.each {|name,value| newNode.attributes[name] = value}
-        newNode
-    end
+        def cloneNode
+          newNode = self.class.new name
+          attributes.each {|name,value| newNode.attributes[name] = value}
+          newNode
+        end
 
-    def attributes= value
-        value.each {|name,value| rxobj.attributes[name]=value}
-    end
+        def attributes= value
+          value.each {|name, value| rxobj.attributes[name]=value}
+        end
 
-    def printTree indent=0
-        tree = "\n|#{' ' * indent}<#{name}>"
-        indent += 2
-        for name, value in attributes
+        def printTree indent=0
+          tree = "\n|#{' ' * indent}<#{name}>"
+          indent += 2
+          for name, value in attributes
             next if name == 'xmlns'
             tree += "\n|#{' ' * indent}#{name}=\"#{value}\""
-        end
-        for child in childNodes
+          end
+          for child in childNodes
             tree += child.printTree(indent)
+          end
+          return tree
         end
-        return tree
-    end
-end
+      end
 
-class Document < Node
-    def self.rxclass
-        REXML::Document
-    end
+      class Document < Node
+        def self.rxclass
+          REXML::Document
+        end
 
-    def initialize
-        super nil
-    end
+        def initialize
+          super nil
+        end
 
-    def appendChild node
-       if node.kind_of? Element and node.name == 'html'
-           node.rxobj.add_namespace('http://www.w3.org/1999/xhtml')
-       end
-       super node
-    end
+        def appendChild node
+           if node.kind_of? Element and node.name == 'html'
+             node.rxobj.add_namespace('http://www.w3.org/1999/xhtml')
+           end
+           super node
+        end
 
-    def printTree indent=0
-        tree = "#document"
-        for child in childNodes
+        def printTree indent=0
+          tree = "#document"
+          for child in childNodes
             tree += child.printTree(indent + 2)
+          end
+          return tree
         end
-        return tree
-    end
-end
+      end
 
-class DocumentType < Node
-    def self.rxclass
-        REXML::DocType
-    end
+      class DocumentType < Node
+        def self.rxclass
+          REXML::DocType
+        end
 
-    def printTree indent=0
-        "\n|#{' ' * indent}<!DOCTYPE #{name}>"
-    end
-end
+        def printTree indent=0
+          "\n|#{' ' * indent}<!DOCTYPE #{name}>"
+        end
+      end
 
-class DocumentFragment < Element
-    def initialize
-        super nil
-    end
+      class DocumentFragment < Element
+        def initialize
+          super nil
+        end
 
-    def printTree indent=0
-        tree = ""
-        for child in childNodes
+        def printTree indent=0
+          tree = ""
+          for child in childNodes
             tree += child.printTree(indent+2)
+          end
+          return tree
         end
-        return tree
+      end
+
+      class TextNode < Node
+        def initialize data
+          raw=data.gsub('&','&amp;').gsub('<','&lt;').gsub('>','&gt;')
+          @rxobj = REXML::Text.new(raw, true, nil, true)
+        end
+
+        def printTree indent=0
+          "\n|#{' ' * indent}\"#{rxobj.value}\""
+        end
+      end
+
+      class CommentNode < Node
+        def self.rxclass
+          REXML::Comment
+        end
+
+        def printTree indent=0
+          "\n|#{' ' * indent}<!-- #{rxobj.string} -->"
+        end
+      end
+
+      class TreeBuilder < Base::TreeBuilder
+        def initialize
+          @documentClass = Document
+          @doctypeClass = DocumentType
+          @elementClass = Element
+          @commentClass = CommentNode
+          @fragmentClass = DocumentFragment
+        end
+
+        def testSerializer node
+          node.printTree()
+        end
+
+        def getDocument
+          @document.rxobj
+        end
+
+        def getFragment
+          @document = super
+          return @document.rxobj.children
+        end
+      end
+
     end
-end
-
-class TextNode < Node
-    def initialize data
-        raw=data.gsub('&','&amp;').gsub('<','&lt;').gsub('>','&gt;')
-        @rxobj = REXML::Text.new(raw, true, nil, true)
-    end
-
-    def printTree indent=0
-        "\n|#{' ' * indent}\"#{rxobj.value}\""
-    end
-end
-
-class CommentNode < Node
-    def self.rxclass
-        REXML::Comment
-    end
-
-    def printTree indent=0
-        "\n|#{' ' * indent}<!-- #{rxobj.string} -->"
-    end
-end
-
-class TreeBuilder < Base::TreeBuilder
-    def initialize
-        @documentClass = Document
-        @doctypeClass = DocumentType
-        @elementClass = Element
-        @commentClass = CommentNode
-        @fragmentClass = DocumentFragment
-    end
-
-    def testSerializer node
-        node.printTree()
-    end
-
-    def getDocument
-        @document.rxobj
-    end
-
-    def getFragment
-        @document = super
-        return @document.rxobj.children
-    end
-end
-
-end
-end
+  end
 end
diff --git a/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/simpletree.rb b/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/simpletree.rb
index 71379ec7..ff4d8f5d 100644
--- a/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/simpletree.rb
+++ b/vendor/plugins/HTML5lib/lib/html5lib/treebuilders/simpletree.rb
@@ -1,178 +1,178 @@
 require 'html5lib/treebuilders/base'
 
 module HTML5lib
-module TreeBuilders
-module SimpleTree
+  module TreeBuilders
+    module SimpleTree
 
-class Node < Base::Node
-    # Node representing an item in the tree.
-    # name - The tag name associated with the node
-    attr_accessor :name
+      class Node < Base::Node
+        # Node representing an item in the tree.
+        # name - The tag name associated with the node
+        attr_accessor :name
 
-    # The value of the current node (applies to text nodes and 
-    # comments
-    attr_accessor :value
+        # The value of the current node (applies to text nodes and 
+        # comments
+        attr_accessor :value
 
-    # a dict holding name, value pairs for attributes of the node
-    attr_accessor :attributes
+        # a dict holding name, value pairs for attributes of the node
+        attr_accessor :attributes
 
-    def initialize name
-        super
-        @name = name
-        @value = nil
-        @attributes = {}
-    end
+        def initialize name
+          super
+          @name = name
+          @value = nil
+          @attributes = {}
+        end
 
-    def appendChild node
-        if node.kind_of? TextNode and 
-          childNodes.length>0 and childNodes[-1].kind_of? TextNode
+        def appendChild node
+          if node.kind_of? TextNode and 
+            childNodes.length>0 and childNodes[-1].kind_of? TextNode
             childNodes[-1].value += node.value
-        else
+          else
             childNodes.push node
+          end
+          node.parent = self
         end
-        node.parent = self
-    end
 
-    def removeChild node
-       childNodes.delete node
-       node.parent = nil
-    end
+        def removeChild node
+           childNodes.delete node
+           node.parent = nil
+        end
 
-    def cloneNode
-        newNode = self.class.new name
-        attributes.each {|name,value| newNode.attributes[name] = value}
-        newNode.value = value
-        newNode
-    end
+        def cloneNode
+          newNode = self.class.new name
+          attributes.each {|name,value| newNode.attributes[name] = value}
+          newNode.value = value
+          newNode
+        end
 
-    def insertText data, before=nil
-        if before
+        def insertText data, before=nil
+          if before
             insertBefore TextNode.new(data), before
-        else
+          else
             appendChild TextNode.new(data)
+          end
         end
-    end
 
-    def insertBefore node, refNode
-        index = childNodes.index(refNode)
-        if node.kind_of? TextNode and index>0 and 
-          childNodes[index-1].kind_of? TextNode
+        def insertBefore node, refNode
+          index = childNodes.index(refNode)
+          if node.kind_of? TextNode and index>0 and 
+            childNodes[index-1].kind_of? TextNode
             childNodes[index-1].value += node.value
-        else
+          else
             childNodes.insert index, node
+          end
         end
-    end
 
-    def printTree indent=0
-        tree = "\n|%s%s" % [' '* indent, self.to_s]
-        for child in childNodes
+        def printTree indent=0
+          tree = "\n|%s%s" % [' '* indent, self.to_s]
+          for child in childNodes
             tree += child.printTree(indent + 2)
+          end
+          return tree
         end
-        return tree
-    end
 
-    def hasContent
-        return (childNodes.length > 0)
-    end
-end
+        def hasContent
+          return (childNodes.length > 0)
+        end
+      end
 
-class Element < Node
-    def to_s
-       "<%s>" % name
-    end
+      class Element < Node
+        def to_s
+           "<%s>" % name
+        end
 
-    def printTree indent=0
-        tree = "\n|%s%s" % [' '* indent, self.to_s]
-        indent += 2
-        for name, value in attributes
+        def printTree indent=0
+          tree = "\n|%s%s" % [' '* indent, self.to_s]
+          indent += 2
+          for name, value in attributes
             tree += "\n|%s%s=\"%s\"" % [' ' * indent, name, value]
-        end
-        for child in childNodes
+          end
+          for child in childNodes
             tree += child.printTree(indent)
+          end
+          return tree
         end
-        return tree
-    end
-end
+      end
 
-class Document < Node
-    def to_s
-       "#document"
-    end
+      class Document < Node
+        def to_s
+           "#document"
+        end
 
-    def initialize
-        super nil
-    end
+        def initialize
+          super nil
+        end
 
-    def printTree indent=0
-        tree = to_s
-        for child in childNodes
+        def printTree indent=0
+          tree = to_s
+          for child in childNodes
             tree += child.printTree(indent + 2)
+          end
+          return tree
         end
-        return tree
-    end
-end
+      end
 
-class DocumentType < Node
-    def to_s
-       "<!DOCTYPE %s>" % name
-    end
-end
+      class DocumentType < Node
+        def to_s
+           "<!DOCTYPE %s>" % name
+        end
+      end
 
-class DocumentFragment < Element
-    def initialize
-        super nil
-    end
+      class DocumentFragment < Element
+        def initialize
+          super nil
+        end
 
-    def printTree indent=0
-        tree = ""
-        for child in childNodes
+        def printTree indent=0
+          tree = ""
+          for child in childNodes
             tree += child.printTree(indent+2)
+          end
+          return tree
         end
-        return tree
+      end
+
+      class TextNode < Node
+        def initialize value
+          super nil
+          @value = value
+        end
+
+        def to_s
+           '"%s"' % value
+        end
+      end
+
+      class CommentNode < Node
+        def initialize value
+          super nil
+          @value = value
+        end
+
+        def to_s
+          "<!-- %s -->" % value
+        end
+      end
+
+      class TreeBuilder < Base::TreeBuilder
+        def initialize
+          @documentClass = Document
+          @doctypeClass = DocumentType
+          @elementClass = Element
+          @commentClass = CommentNode
+          @fragmentClass = DocumentFragment
+        end
+
+        def testSerializer node
+          node.printTree()
+        end
+
+        def getFragment
+          @document = super
+          return @document.childNodes
+        end
+      end
+
     end
-end
-
-class TextNode < Node
-    def initialize value
-        super nil
-        @value = value
-    end
-
-    def to_s
-       '"%s"' % value
-    end
-end
-
-class CommentNode < Node
-    def initialize value
-        super nil
-        @value = value
-    end
-
-    def to_s
-        "<!-- %s -->" % value
-    end
-end
-
-class TreeBuilder < Base::TreeBuilder
-    def initialize
-        @documentClass = Document
-        @doctypeClass = DocumentType
-        @elementClass = Element
-        @commentClass = CommentNode
-        @fragmentClass = DocumentFragment
-    end
-
-    def testSerializer node
-        node.printTree()
-    end
-
-    def getFragment
-        @document = super
-        return @document.childNodes
-    end
-end
-
-end
-end
+  end
 end
diff --git a/vendor/plugins/HTML5lib/tests/preamble.rb b/vendor/plugins/HTML5lib/tests/preamble.rb
index d6c856f4..6e2d5a27 100644
--- a/vendor/plugins/HTML5lib/tests/preamble.rb
+++ b/vendor/plugins/HTML5lib/tests/preamble.rb
@@ -7,5 +7,17 @@ $:.unshift File.join(File.dirname(File.dirname(__FILE__)),'lib')
 $:.unshift File.dirname(__FILE__)
 
 def html5lib_test_files(subdirectory)
-    Dir[File.join(HTML5LIB_BASE, 'tests', subdirectory, '*.*')]
+  Dir[File.join(HTML5LIB_BASE, 'tests', subdirectory, '*.*')]
+end
+
+begin
+  require 'jsonx'
+rescue LoadError
+  class JSON
+    def self.parse json
+      json.gsub! /"\s*:/, '"=>'
+      json.gsub!(/\\u[0-9a-fA-F]{4}/) {|x| [x[2..-1].to_i(16)].pack('U')}
+      eval json
+    end
+  end
 end
diff --git a/vendor/plugins/HTML5lib/tests/test_encoding.rb b/vendor/plugins/HTML5lib/tests/test_encoding.rb
index 6e973299..384887c7 100755
--- a/vendor/plugins/HTML5lib/tests/test_encoding.rb
+++ b/vendor/plugins/HTML5lib/tests/test_encoding.rb
@@ -11,7 +11,7 @@ begin
     def test_chardet
         File.open(File.join(HTML5LIB_BASE, 'tests', 'encoding', 'chardet', 'test_big5.txt')) do |file|
             stream = HTML5lib::HTMLInputStream.new(file, :chardet => true)
-            assert_equal 'big5', stream.charEncoding.downcase
+            assert_equal 'big5', stream.char_encoding.downcase
         end
     end
 rescue LoadError
@@ -28,7 +28,7 @@ end
 
             define_method 'test_%s_%d' % [ test_name, index + 1 ] do
                 stream = HTML5lib::HTMLInputStream.new(input, :chardet => false)
-                assert_equal encoding.downcase, stream.charEncoding.downcase, input
+                assert_equal encoding.downcase, stream.char_encoding.downcase, input
             end
         end
     end
diff --git a/vendor/plugins/HTML5lib/tests/test_lxp.rb b/vendor/plugins/HTML5lib/tests/test_lxp.rb
index 7f1a4f70..52792244 100755
--- a/vendor/plugins/HTML5lib/tests/test_lxp.rb
+++ b/vendor/plugins/HTML5lib/tests/test_lxp.rb
@@ -6,19 +6,19 @@ XMLELEM = /<(\w+\s*)((?:[-:\w]+="[^"]*"\s*)+)(\/?)>/
 SORTATTRS = '<#{$1+$2.split.sort.join(' ')+$3}>'
 
 def assert_xml_equal(input, expected=nil, parser=HTML5lib::XMLParser)
-    document = parser.parse(input.chomp).root
-    if not expected
-        expected = input.chomp.gsub(XMLELEM,SORTATTRS)
-        expected = expected.gsub(/&#(\d+);/) {[$1.to_i].pack('U')}
-        output = document.to_s.gsub(/'/,'"').gsub(XMLELEM,SORTATTRS)
-        assert_equal(expected, output)
-    else
-        assert_equal(expected, document.to_s.gsub(/'/,'"'))
-    end
+  document = parser.parse(input.chomp).root
+  if not expected
+    expected = input.chomp.gsub(XMLELEM,SORTATTRS)
+    expected = expected.gsub(/&#(\d+);/) {[$1.to_i].pack('U')}
+    output = document.to_s.gsub(/'/,'"').gsub(XMLELEM,SORTATTRS)
+    assert_equal(expected, output)
+  else
+    assert_equal(expected, document.to_s.gsub(/'/,'"'))
+  end
 end
 
 def assert_xhtml_equal(input, expected=nil, parser=HTML5lib::XHTMLParser)
-      assert_xml_equal(input, expected, parser)
+  assert_xml_equal(input, expected, parser)
 end
 
 class BasicXhtml5Test < Test::Unit::TestCase
@@ -27,8 +27,8 @@ class BasicXhtml5Test < Test::Unit::TestCase
     assert_xhtml_equal(
       '<title>Xhtml</title><b><i>content</b></i>',
       '<html xmlns="http://www.w3.org/1999/xhtml">' +
-        '<head><title>Xhtml</title></head>' + 
-        '<body><b><i>content</i></b></body>' +
+      '<head><title>Xhtml</title></head>' + 
+      '<body><b><i>content</i></b></body>' +
       '</html>')
   end
 
@@ -36,8 +36,8 @@ class BasicXhtml5Test < Test::Unit::TestCase
     assert_xhtml_equal(
       '<title>mdash</title>A &mdash B',
       '<html xmlns="http://www.w3.org/1999/xhtml">' +
-        '<head><title>mdash</title></head>' + 
-        '<body>A '+ [0x2014].pack('U') + ' B</body>' +
+      '<head><title>mdash</title></head>' + 
+      '<body>A '+ [0x2014].pack('U') + ' B</body>' +
       '</html>')
   end
 end
@@ -70,24 +70,24 @@ class OpmlTest < Test::Unit::TestCase
   def test_mixedCaseElement
     assert_xml_equal(
       '<opml version="1.0">' +
-        '<head><ownerName>Dave Winer</ownerName></head>' +
+      '<head><ownerName>Dave Winer</ownerName></head>' +
       '</opml>')
   end
 
   def test_mixedCaseAttribute
     assert_xml_equal(
       '<opml version="1.0">' +
-        '<body><outline isComment="true"/></body>' +
+      '<body><outline isComment="true"/></body>' +
       '</opml>')
   end
 
   def test_malformed
     assert_xml_equal(
       '<opml version="1.0">' +
-        '<body><outline text="Odds & Ends"/></body>' +
+      '<body><outline text="Odds & Ends"/></body>' +
       '</opml>',
       '<opml version="1.0">' +
-        '<body><outline text="Odds &amp; Ends"/></body>' +
+      '<body><outline text="Odds &amp; Ends"/></body>' +
       '</opml>')
   end
 end
@@ -100,45 +100,45 @@ class XhtmlTest < Test::Unit::TestCase
 <head><title>MathML</title></head>
 <body>
   <math xmlns="http://www.w3.org/1998/Math/MathML">
+  <mrow>
+    <mi>x</mi>
+    <mo>=</mo>
+
+    <mfrac>
     <mrow>
-      <mi>x</mi>
-      <mo>=</mo>
+      <mrow>
+      <mo>-</mo>
+      <mi>b</mi>
+      </mrow>
+      <mo>&#177;</mo>
+      <msqrt>
 
-      <mfrac>
+      <mrow>
+        <msup>
+        <mi>b</mi>
+        <mn>2</mn>
+        </msup>
+        <mo>-</mo>
         <mrow>
-          <mrow>
-            <mo>-</mo>
-            <mi>b</mi>
-          </mrow>
-          <mo>&#177;</mo>
-          <msqrt>
 
-            <mrow>
-              <msup>
-                <mi>b</mi>
-                <mn>2</mn>
-              </msup>
-              <mo>-</mo>
-              <mrow>
-
-                <mn>4</mn>
-                <mo>&#8290;</mo>
-                <mi>a</mi>
-                <mo>&#8290;</mo>
-                <mi>c</mi>
-              </mrow>
-            </mrow>
-
-          </msqrt>
+        <mn>4</mn>
+        <mo>&#8290;</mo>
+        <mi>a</mi>
+        <mo>&#8290;</mo>
+        <mi>c</mi>
         </mrow>
-        <mrow>
-          <mn>2</mn>
-          <mo>&#8290;</mo>
-          <mi>a</mi>
-        </mrow>
-      </mfrac>
+      </mrow>
 
+      </msqrt>
     </mrow>
+    <mrow>
+      <mn>2</mn>
+      <mo>&#8290;</mo>
+      <mi>a</mi>
+    </mrow>
+    </mfrac>
+
+  </mrow>
   </math>
 </body></html>
 EOX
@@ -150,11 +150,11 @@ EOX
 <head><title>SVG</title></head>
 <body>
   <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 100 100">
-    <path d="M38,38c0-12,24-15,23-2c0,9-16,13-16,23v7h11v-4c0-9,17-12,17-27
-             c-2-22-45-22-45,3zM45,70h11v11h-11z" fill="#371">
-    </path>
-    <circle cx="50" cy="50" r="45" fill="none" stroke="#371" stroke-width="10">
-    </circle>
+  <path d="M38,38c0-12,24-15,23-2c0,9-16,13-16,23v7h11v-4c0-9,17-12,17-27
+       c-2-22-45-22-45,3zM45,70h11v11h-11z" fill="#371">
+  </path>
+  <circle cx="50" cy="50" r="45" fill="none" stroke="#371" stroke-width="10">
+  </circle>
 
   </svg>
 </body></html>
@@ -167,24 +167,24 @@ EOX
 <head><title>XLINK</title></head>
 <body>
   <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 100 100">
-    <defs xmlns:l="http://www.w3.org/1999/xlink">
-      <radialGradient id="s1" fx=".4" fy=".2" r=".7">
-        <stop stop-color="#FE8"/>
-        <stop stop-color="#D70" offset="1"/>
-      </radialGradient>
-      <radialGradient id="s2" fx=".8" fy=".5" l:href="#s1"/>
-      <radialGradient id="s3" fx=".5" fy=".9" l:href="#s1"/>
-      <radialGradient id="s4" fx=".1" fy=".5" l:href="#s1"/>
-    </defs>
-    <g stroke="#940">
-      <path d="M73,29c-37-40-62-24-52,4l6-7c-8-16,7-26,42,9z" fill="url(#s1)"/>
-      <path d="M47,8c33-16,48,21,9,47l-6-5c38-27,20-44,5-37z" fill="url(#s2)"/>
-      <path d="M77,32c22,30,10,57-39,51l-1-8c3,3,67,5,36-36z" fill="url(#s3)"/>
+  <defs xmlns:l="http://www.w3.org/1999/xlink">
+    <radialGradient id="s1" fx=".4" fy=".2" r=".7">
+    <stop stop-color="#FE8"/>
+    <stop stop-color="#D70" offset="1"/>
+    </radialGradient>
+    <radialGradient id="s2" fx=".8" fy=".5" l:href="#s1"/>
+    <radialGradient id="s3" fx=".5" fy=".9" l:href="#s1"/>
+    <radialGradient id="s4" fx=".1" fy=".5" l:href="#s1"/>
+  </defs>
+  <g stroke="#940">
+    <path d="M73,29c-37-40-62-24-52,4l6-7c-8-16,7-26,42,9z" fill="url(#s1)"/>
+    <path d="M47,8c33-16,48,21,9,47l-6-5c38-27,20-44,5-37z" fill="url(#s2)"/>
+    <path d="M77,32c22,30,10,57-39,51l-1-8c3,3,67,5,36-36z" fill="url(#s3)"/>
 
-      <path d="M58,84c-4,20-38-4-8-24l-6-5c-36,43,15,56,23,27z" fill="url(#s4)"/>
-      <path d="M40,14c-40,37-37,52-9,68l1-8c-16-13-29-21,16-56z" fill="url(#s1)"/>
-      <path d="M31,33c19,23,20,7,35,41l-9,1.7c-4-19-8-14-31-37z" fill="url(#s2)"/>
-    </g>
+    <path d="M58,84c-4,20-38-4-8-24l-6-5c-36,43,15,56,23,27z" fill="url(#s4)"/>
+    <path d="M40,14c-40,37-37,52-9,68l1-8c-16-13-29-21,16-56z" fill="url(#s1)"/>
+    <path d="M31,33c19,23,20,7,35,41l-9,1.7c-4-19-8-14-31-37z" fill="url(#s2)"/>
+  </g>
   </svg>
 </body></html>
 EOX
diff --git a/vendor/plugins/HTML5lib/tests/test_parser.rb b/vendor/plugins/HTML5lib/tests/test_parser.rb
index f1f9484d..ab26cb07 100644
--- a/vendor/plugins/HTML5lib/tests/test_parser.rb
+++ b/vendor/plugins/HTML5lib/tests/test_parser.rb
@@ -7,8 +7,8 @@ require 'html5lib/html5parser'
 $tree_types_to_test = ['simpletree', 'rexml']
 
 begin
-    require 'hpricot'
-    $tree_types_to_test.push('hpricot')
+  require 'hpricot'
+  $tree_types_to_test.push('hpricot')
 rescue LoadError
 end
 
@@ -19,90 +19,90 @@ puts 'Testing: ' + $tree_types_to_test * ', '
 
 class Html5ParserTestCase < Test::Unit::TestCase
 
-    def self.startswith?(a, b)
-        b[0... a.length] == a
-    end
+  def self.startswith?(a, b)
+    b[0... a.length] == a
+  end
 
-    def self.parseTestcase(data)
-        innerHTML = nil
-        input = []
-        output = []
-        errors = []
-        currentList = input
-        data.split(/\n/).each do |line|
-            if !line.empty? and !startswith?("#errors", line) and
-              !startswith?("#document", line) and
-              !startswith?("#data", line) and
-              !startswith?("#document-fragment", line)
+  def self.parseTestcase(data)
+    innerHTML = nil
+    input = []
+    output = []
+    errors = []
+    currentList = input
+    data.split(/\n/).each do |line|
+      if !line.empty? and !startswith?("#errors", line) and
+        !startswith?("#document", line) and
+        !startswith?("#data", line) and
+        !startswith?("#document-fragment", line)
 
-                if currentList == output and startswith?("|", line)
-                    currentList.push(line[2..-1])
-                else
-                    currentList.push(line)
-                end
-            elsif line == "#errors"
-                currentList = errors
-            elsif line == "#document" or startswith?("#document-fragment", line)
-                if startswith?("#document-fragment", line)
-                    innerHTML = line[19..-1]
-                    raise AssertionError unless innerHTML
-                end
-                currentList = output
-            end
+        if currentList == output and startswith?("|", line)
+          currentList.push(line[2..-1])
+        else
+          currentList.push(line)
         end
-        return innerHTML, input.join("\n"), output.join("\n"), errors
-    end
-    
-    # convert the output of str(document) to the format used in the testcases
-    def convertTreeDump(treedump)
-        treedump.split(/\n/)[1..-1].map { |line| (line.length > 2 and line[0] == ?|) ? line[3..-1] : line }.join("\n")
-    end
-
-    def sortattrs(output)
-        output.gsub(/^(\s+)\w+=.*(\n\1\w+=.*)+/) { |match| match.split("\n").sort.join("\n") }
-    end
-
-    html5lib_test_files('tree-construction').each do |test_file|
-
-        test_name = File.basename(test_file).sub('.dat', '')
-
-        File.read(test_file).split("#data\n").each_with_index do |data, index|
-            next if data.empty?
-       
-            innerHTML, input, expected_output, expected_errors = parseTestcase(data)
-
-            $tree_types_to_test.each do |tree_name|
-                define_method 'test_%s_%d_%s' % [ test_name, index + 1, tree_name ] do
-
-                    parser = HTML5lib::HTMLParser.new(:tree => HTML5lib::TreeBuilders.getTreeBuilder(tree_name))
-                
-                    if innerHTML
-                        parser.parseFragment(input, innerHTML)
-                    else
-                        parser.parse(input)
-                    end
-                
-                    actual_output = convertTreeDump(parser.tree.testSerializer(parser.tree.document))
-
-                    assert_equal sortattrs(expected_output), sortattrs(actual_output), [
-                        'Input:', input,
-                        'Expected:', expected_output,
-                        'Recieved:', actual_output
-                    ].join("\n")
-
-                    if $CHECK_PARSER_ERRORS
-                        actual_errors = parser.errors.map do |(line, col), message|
-                            'Line: %i Col: %i %s' % [line, col, message]
-                        end
-                        assert_equal parser.errors.length, expected_errors.length, [
-                            'Expected errors:', expected_errors.join("\n"),
-                            'Actual errors:', actual_errors.join("\n") 
-                        ].join("\n")
-                    end
-                    
-                end
-            end
+      elsif line == "#errors"
+        currentList = errors
+      elsif line == "#document" or startswith?("#document-fragment", line)
+        if startswith?("#document-fragment", line)
+          innerHTML = line[19..-1]
+          raise AssertionError unless innerHTML
         end
+        currentList = output
+      end
     end
+    return innerHTML, input.join("\n"), output.join("\n"), errors
+  end
+  
+  # convert the output of str(document) to the format used in the testcases
+  def convertTreeDump(treedump)
+    treedump.split(/\n/)[1..-1].map { |line| (line.length > 2 and line[0] == ?|) ? line[3..-1] : line }.join("\n")
+  end
+
+  def sortattrs(output)
+    output.gsub(/^(\s+)\w+=.*(\n\1\w+=.*)+/) { |match| match.split("\n").sort.join("\n") }
+  end
+
+  html5lib_test_files('tree-construction').each do |test_file|
+
+    test_name = File.basename(test_file).sub('.dat', '')
+
+    File.read(test_file).split("#data\n").each_with_index do |data, index|
+      next if data.empty?
+     
+      innerHTML, input, expected_output, expected_errors = parseTestcase(data)
+
+      $tree_types_to_test.each do |tree_name|
+        define_method 'test_%s_%d_%s' % [ test_name, index + 1, tree_name ] do
+
+          parser = HTML5lib::HTMLParser.new(:tree => HTML5lib::TreeBuilders.getTreeBuilder(tree_name))
+        
+          if innerHTML
+            parser.parseFragment(input, innerHTML)
+          else
+            parser.parse(input)
+          end
+        
+          actual_output = convertTreeDump(parser.tree.testSerializer(parser.tree.document))
+
+          assert_equal sortattrs(expected_output), sortattrs(actual_output), [
+            'Input:', input,
+            'Expected:', expected_output,
+            'Recieved:', actual_output
+          ].join("\n")
+
+          if $CHECK_PARSER_ERRORS
+            actual_errors = parser.errors.map do |(line, col), message|
+              'Line: %i Col: %i %s' % [line, col, message]
+            end
+            assert_equal parser.errors.length, expected_errors.length, [
+              'Expected errors:', expected_errors.join("\n"),
+              'Actual errors:', actual_errors.join("\n") 
+            ].join("\n")
+          end
+          
+        end
+      end
+    end
+  end
 
 end
diff --git a/vendor/plugins/HTML5lib/tests/test_sanitizer.rb b/vendor/plugins/HTML5lib/tests/test_sanitizer.rb
index 619253f8..3b440071 100644
--- a/vendor/plugins/HTML5lib/tests/test_sanitizer.rb
+++ b/vendor/plugins/HTML5lib/tests/test_sanitizer.rb
@@ -203,4 +203,8 @@ class SanitizeTest < Test::Unit::TestCase
        sanitize_html(%(<img src='vbscript:msgbox("XSS")' />))
   end
 
+  def test_should_handle_astral_plane_characters
+    assert_equal "<p>\360\235\222\265 \360\235\224\270</p>",
+      sanitize_html("<p>&#x1d4b5; &#x1d538;</p>")
+  end
 end
diff --git a/vendor/plugins/HTML5lib/tests/test_tokenizer.rb b/vendor/plugins/HTML5lib/tests/test_tokenizer.rb
index b4ed02d7..5d367a06 100644
--- a/vendor/plugins/HTML5lib/tests/test_tokenizer.rb
+++ b/vendor/plugins/HTML5lib/tests/test_tokenizer.rb
@@ -4,75 +4,63 @@ require 'html5lib/tokenizer'
 
 require 'tokenizer_test_parser'
 
-begin
-  require 'jsonx'
-rescue LoadError
-  class JSON
-    def self.parse json
-      json.gsub! /"\s*:/, '"=>'
-      json.gsub!(/\\u[0-9a-fA-F]{4}/) {|x| [x[2..-1].to_i(16)].pack('U')}
-      eval json
-    end
-  end
-end 
-
 class Html5TokenizerTestCase < Test::Unit::TestCase
 
-    def type_of?(token_name, token)
-        token != 'ParseError' and token_name == token.first
+  def type_of?(token_name, token)
+    token != 'ParseError' and token_name == token.first
+  end
+
+  def convert_attribute_arrays_to_hashes(tokens)
+    tokens.inject([]) do |tokens, token|
+      token[2] = Hash[*token[2].reverse.flatten] if type_of?('StartTag', token)
+      tokens << token
     end
-
-    def convert_attribute_arrays_to_hashes(tokens)
-        tokens.inject([]) do |tokens, token|
-            token[2] = Hash[*token[2].reverse.flatten] if type_of?('StartTag', token)
-            tokens << token
-        end
+  end
+  
+  def concatenate_consecutive_characters(tokens)
+    tokens.inject([]) do |tokens, token|
+      if type_of?('Character', token) and tokens.any? and type_of?('Character', tokens.last)
+        tokens.last[1] = tokens.last[1] + token[1]
+        next tokens
+      end
+      tokens << token
     end
-    
-    def concatenate_consecutive_characters(tokens)
-        tokens.inject([]) do |tokens, token|
-            if type_of?('Character', token) and tokens.any? and type_of?('Character', tokens.last)
-                tokens.last[1] = tokens.last[1] + token[1]
-                next tokens
-            end
-            tokens << token
-        end
-    end
-
-    def tokenizer_test(data)
-        (data['contentModelFlags'] || [:PCDATA]).each do |content_model_flag|
-            message = [
-                'Description:', data['description'],
-                'Input:', data['input'],
-                'Content Model Flag:', content_model_flag ] * "\n"
-
-            assert_nothing_raised message do
-                tokenizer = HTML5lib::HTMLTokenizer.new(data['input'])
-
-                tokenizer.contentModelFlag = content_model_flag.to_sym
-                
-                tokenizer.currentToken = {:type => :startTag, :name => data['lastStartTag']} if data.has_key?('lastStartTag')
-
-                tokens = TokenizerTestParser.new(tokenizer).parse
-
-                actual = concatenate_consecutive_characters(convert_attribute_arrays_to_hashes(tokens))
-
-                expected = concatenate_consecutive_characters(data['output'])
-
-                assert_equal expected, actual, message
-            end
-        end 
-    end
-
-    html5lib_test_files('tokenizer').each do |test_file|
-        test_name = File.basename(test_file).sub('.test', '')
-
-        tests = JSON.parse(File.read(test_file))['tests']
-
-        tests.each_with_index do |data, index|
-            define_method('test_%s_%d' % [test_name, index + 1]) { tokenizer_test data }
-        end
+  end
+
+  def tokenizer_test(data)
+    (data['contentModelFlags'] || [:PCDATA]).each do |content_model_flag|
+      message = [
+        'Description:', data['description'],
+        'Input:', data['input'],
+        'Content Model Flag:', content_model_flag ] * "\n"
+
+      assert_nothing_raised message do
+        tokenizer = HTML5lib::HTMLTokenizer.new(data['input'])
+
+        tokenizer.contentModelFlag = content_model_flag.to_sym
+
+        tokenizer.currentToken = {:type => :startTag, :name => data['lastStartTag']} if data.has_key?('lastStartTag')
+
+        tokens = TokenizerTestParser.new(tokenizer).parse
+
+        actual = concatenate_consecutive_characters(convert_attribute_arrays_to_hashes(tokens))
+
+        expected = concatenate_consecutive_characters(data['output'])
+
+        assert_equal expected, actual, message
+      end
+    end 
+  end
+
+  html5lib_test_files('tokenizer').each do |test_file|
+    test_name = File.basename(test_file).sub('.test', '')
+
+    tests = JSON.parse(File.read(test_file))['tests']
+
+    tests.each_with_index do |data, index|
+      define_method('test_%s_%d' % [test_name, index + 1]) { tokenizer_test data }
     end
+  end
 
 end
 
diff --git a/vendor/plugins/HTML5lib/tests/tokenizer_test_parser.rb b/vendor/plugins/HTML5lib/tests/tokenizer_test_parser.rb
index 8f6db031..d48c458f 100644
--- a/vendor/plugins/HTML5lib/tests/tokenizer_test_parser.rb
+++ b/vendor/plugins/HTML5lib/tests/tokenizer_test_parser.rb
@@ -1,62 +1,62 @@
 require 'html5lib/constants'
 
 class TokenizerTestParser
-    def initialize(tokenizer)
-        @tokenizer = tokenizer
+  def initialize(tokenizer)
+    @tokenizer = tokenizer
+  end
+
+  def parse
+    @outputTokens = []
+
+    debug = nil
+    for token in @tokenizer
+      debug = token.inspect if token[:type] == :ParseError
+      send ('process' + token[:type].to_s), token
     end
 
-    def parse
-        @outputTokens = []
+    return @outputTokens
+  end
 
-        debug = nil
-        for token in @tokenizer
-            debug = token.inspect if token[:type] == :ParseError
-            send ('process' + token[:type].to_s), token
-        end
+  def processDoctype(token)
+    @outputTokens.push(["DOCTYPE", token[:name], token[:data]])
+  end
 
-        return @outputTokens
+  def processStartTag(token)
+    @outputTokens.push(["StartTag", token[:name], token[:data]])
+  end
+
+  def processEmptyTag(token)
+    if not HTML5lib::VOID_ELEMENTS.include? token[:name]
+      @outputTokens.push("ParseError")
     end
+    @outputTokens.push(["StartTag", token[:name], token[:data]])
+  end
 
-    def processDoctype(token)
-        @outputTokens.push(["DOCTYPE", token[:name], token[:data]])
+  def processEndTag(token)
+    if token[:data].length > 0
+      self.processParseError(token)
     end
+    @outputTokens.push(["EndTag", token[:name]])
+  end
 
-    def processStartTag(token)
-        @outputTokens.push(["StartTag", token[:name], token[:data]])
-    end
+  def processComment(token)
+    @outputTokens.push(["Comment", token[:data]])
+  end
 
-    def processEmptyTag(token)
-        if not HTML5lib::VOID_ELEMENTS.include? token[:name]
-            @outputTokens.push("ParseError")
-        end
-        @outputTokens.push(["StartTag", token[:name], token[:data]])
-    end
+  def processCharacters(token)
+    @outputTokens.push(["Character", token[:data]])
+  end
 
-    def processEndTag(token)
-        if token[:data].length > 0
-            self.processParseError(token)
-        end
-        @outputTokens.push(["EndTag", token[:name]])
-    end
+  alias processSpaceCharacters processCharacters
 
-    def processComment(token)
-        @outputTokens.push(["Comment", token[:data]])
-    end
+  def processCharacters(token)
+    @outputTokens.push(["Character", token[:data]])
+  end
 
-    def processCharacters(token)
-        @outputTokens.push(["Character", token[:data]])
-    end
+  def processEOF(token)
+  end
 
-    alias processSpaceCharacters processCharacters
-
-    def processCharacters(token)
-        @outputTokens.push(["Character", token[:data]])
-    end
-
-    def processEOF(token)
-    end
-
-    def processParseError(token)
-        @outputTokens.push("ParseError")
-    end
+  def processParseError(token)
+    @outputTokens.push("ParseError")
+  end
 end