Bring up to current.

2007-01-22 08:36:51 -06:00 · 2007-01-22 08:36:51 -06:00 · b19e1e4f47
commit b19e1e4f47
parent 69b62b6f33
71 changed files with 8305 additions and 39 deletions
--- a/app/controllers/application.rb
+++ b/app/controllers/application.rb
@ -48,6 +48,7 @@ class ApplicationController < ActionController::Base
    '.pdf' => 'application/pdf',
    '.png' => 'image/png',
    '.txt' => 'text/plain',
    '.tex' => 'text/plain',
    '.zip' => 'application/zip'
  } unless defined? FILE_TYPES
@ -114,7 +115,7 @@ class ApplicationController < ActionController::Base
  def rescue_action_in_public(exception)
    render :status => 500, :text => <<-EOL
-      <html><body>
+      <html xmlns="http://www.w3.org/1999/xhtml"><body>
        <h2>Internal Error</h2>
        <p>An application error occurred while processing your request.</p>
        <!-- \n#{exception}\n#{exception.backtrace.join("\n")}\n -->
@ -145,8 +146,10 @@ class ApplicationController < ActionController::Base
  def set_content_type_header
    if %w(rss_with_content rss_with_headlines).include?(action_name)
      @response.headers['Content-Type'] = 'text/xml; charset=UTF-8'
    elsif %w(tex).include?(action_name)
      @response.headers['Content-Type'] = 'text/plain; charset=UTF-8'
    else
-      @response.headers['Content-Type'] = 'text/html; charset=UTF-8'
+      @response.headers['Content-Type'] = 'application/xhtml+xml; charset=UTF-8'
    end
  end
--- a/app/controllers/wiki_controller.rb
+++ b/app/controllers/wiki_controller.rb
@ -9,7 +9,7 @@ class WikiController < ApplicationController
  caches_action :show, :published, :authors, :recently_revised, :list
  cache_sweeper :revision_sweeper
-  layout 'default', :except => [:rss_feed, :rss_with_content, :rss_with_headlines, :tex,  :export_tex, :export_html]
+  layout 'default', :except => [:rss_feed, :rss_with_content, :rss_with_headlines, :tex, :pdf, :export_tex, :export_html]
  def index
    if @web_name
@ -280,8 +280,12 @@ class WikiController < ApplicationController
  end
  def tex
    if @web.markup == :markdownMML
      @tex_content = Maruku.new(@page.content).to_latex
    else
    @tex_content = RedClothForTex.new(@page.content).to_tex
  end
  end
  protected
@ -305,8 +309,12 @@ class WikiController < ApplicationController
  end
  def export_page_to_tex(file_path)
-    tex
+    if @web.markup == :markdownMML
-    File.open(file_path, 'w') { |f| f.write(render_to_string(:template => 'wiki/tex', :layout => false)) }
+      @tex_content = Maruku.new(@page.content).to_latex
    else
      @tex_content = RedClothForTex.new(@page.content).to_tex
    end
    File.open(file_path, 'w') { |f| f.write(render_to_string(:template => 'wiki/tex', :layout => 'tex')) }
  end
  def export_pages_as_zip(file_type, &block)
@ -396,7 +404,11 @@ class WikiController < ApplicationController
  def render_tex_web
    @web.select.by_name.inject({}) do |tex_web, page|
      if  @web.markup == :markdownMML
        tex_web[page.name] = Maruku.new(page.content).to_latex
      else
      tex_web[page.name] = RedClothForTex.new(page.content).to_tex
      end
      tex_web
    end
  end
--- a/app/helpers/application_helper.rb
+++ b/app/helpers/application_helper.rb
@ -23,7 +23,7 @@ module ApplicationHelper
        if element.last != selected
          options << "<option value=\"#{element.last}\">#{element.first}</option>"
        else
-          options << "<option value=\"#{element.last}\" selected>#{element.first}</option>"
+          options << "<option value=\"#{element.last}\" selected=\"selected\">#{element.first}</option>"
        end
      else
        options << ((element != selected) ? "<option>#{element}</option>" : "<option selected>#{element}</option>")
--- a/app/views/admin/create_system.rhtml
+++ b/app/views/admin/create_system.rhtml
@ -7,7 +7,7 @@
 </p>
 <%= form_tag({ :controller => 'admin', :action => 'create_system' },
-             { 'id' => 'setup', 'method' => 'post', 'onSubmit' => 'return validateSetup()', 
+             { 'id' => 'setup', 'method' => 'post', 'onsubmit' => 'return validateSetup()', 
               'accept-charset' => 'utf-8' })
 %>
 <ol class="setup">
@ -22,9 +22,9 @@
    </div>
    <div class="inputBox">
      Name: <input type="text" id="web_name" name="web_name" value="Wiki" 
-            onChange="proposeAddress();" onClick="this.value == 'Wiki' ? this.value = '' : true" /> 
+            onchange="proposeAddress();" onclick="this.value == 'Wiki' ? this.value = '' : true" /> 
      &nbsp;&nbsp;
-      Address: <input type="text" id="web_address" name="web_address" onChange="cleanAddress();"
+      Address: <input type="text" id="web_address" name="web_address" onchange="cleanAddress();"
               value="wiki" />
    </div>
  </li>
--- a/app/views/admin/create_web.rhtml
+++ b/app/views/admin/create_web.rhtml
@ -7,7 +7,7 @@
 <%= form_tag({ :controller => 'admin', :action => 'create_web' },
             { 'id' => 'setup', 'method' => 'post', 
-               'onSubmit' => 'cleanAddress(); return validateSetup()',
+               'onsubmit' => 'cleanAddress(); return validateSetup()',
               'accept-charset' => 'utf-8' })
 %>
@ -21,9 +21,9 @@
      The address can only consist of letters and digits.
    </div>
    <div class="inputBox">
-      Name: <input type="text" id="web_name" name="name" onChange="proposeAddress();" />
+      Name: <input type="text" id="web_name" name="name" onchange="proposeAddress();" />
      &nbsp;&nbsp;
-      Address: <input type="text" id="web_address" name="address" onChange="cleanAddress();" />
+      Address: <input type="text" id="web_address" name="address" onchange="cleanAddress();" />
    </div>
  </li>
 </ol>
--- a/app/views/admin/edit_web.rhtml
+++ b/app/views/admin/edit_web.rhtml
@ -2,7 +2,7 @@
 <%= form_tag({ :controller => 'admin', :action => 'edit_web', :web => @web.address },
             { 'id' => 'setup', 'method' => 'post', 
-               'onSubmit' => 'cleanAddress(); return validateSetup()',
+               'onsubmit' => 'cleanAddress(); return validateSetup()',
               'accept-charset' => 'utf-8' })
 %>
@ -15,9 +15,9 @@
  <div class="inputBox">
    Name: <input type="text" id="name" name="name" class="disableAutoComplete" value="<%= @web.name %>" 
-                 onChange="proposeAddress();" /> &nbsp;&nbsp;
+                 onchange="proposeAddress();" /> &nbsp;&nbsp;
    Address: <input type="text" class="disableAutoComplete" id="address" name="address" value="<%= @web.address %>" 
-                    onChange="cleanAddress();" />
+                    onchange="cleanAddress();" />
    <small><em>(Letters and digits only)</em></small>
  </div>
@ -25,7 +25,7 @@
  <div class="inputBox">
    Markup:
    <select name="markup">
-      <%= html_options({'Textile' => :textile, 'Markdown' => :markdown, 'Mixed' => :mixed, 
+      <%= html_options({'Textile' => :textile, 'Markdown' => :markdown, 'Markdown+itex2MML' => :markdownMML, 'Mixed' => :mixed, 
              'RDoc' => :rdoc }, @web.markup) %>
    </select>
@ -64,7 +64,7 @@
    </p>
    <a href="#" 
-       onClick="document.getElementById('additionalStyle').style.display='block';return false;">
+       onclick="document.getElementById('additionalStyle').style.display='block';return false;">
    Stylesheet tweaks &gt;&gt;</a>
    <small><em>
    - add or change styles used by this web; styles defined here take precedence over 
@ -120,7 +120,7 @@
 <%= form_tag({:controller => 'admin', :web => @web.address, :action => 'remove_orphaned_pages'},
        { :id => 'remove_orphaned_pages', 
-          :onSubmit => "return checkSystemPassword(document.getElementById('system_password_orphaned').value)",
+          :onsubmit => "return checkSystemPassword(document.getElementById('system_password_orphaned').value)",
          'accept-charset' => 'utf-8' }) 
 %>
  <p align="right">
--- a/app/views/file/import.rhtml
+++ b/app/views/file/import.rhtml
@ -13,7 +13,7 @@
  <p>
    <input type="submit" value="Update" /> as 
    <input type="text" name="author" id="authorName" value="<%= @author %>" 
-        onClick="this.value == 'AnonymousCoward' ? this.value = '' : true" />
+        onclick="this.value == 'AnonymousCoward' ? this.value = '' : true" />
 	<% if @page %>
      | <%= link_to 'Cancel', :web => @web.address, :action => 'file'%> <small>(unlocks page)</small>
    <% end %>
--- a/app/views/layouts/default.rhtml
+++ b/app/views/layouts/default.rhtml
@ -1,6 +1,4 @@
-<!DOCTYPE html
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1 plus MathML 2.0//EN" "http://www.w3.org/Math/DTD/mathml2/xhtml-math11-f.dtd" >
 PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
 "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
 <html xmlns="http://www.w3.org/1999/xhtml">
 <head>
  <title>
--- a/app/views/layouts/tex.rhtml
+++ b/app/views/layouts/tex.rhtml
@ -0,0 +1 @@
 <%= @content_for_layout %>
--- a/app/views/markdownMML_help.rhtml
+++ b/app/views/markdownMML_help.rhtml
@ -0,0 +1,13 @@
 <h3>Markdown + itex2MML  formatting tips (<a target="_new" href="http://daringfireball.net/projects/markdown/syntax">advanced</a>)</h3>
 <table cellspacing="0" cellpadding="0">
  <tr><td>_your text_</td><td class="arrow">&rarr;</td><td><em>your text</em></td></tr>
  <tr><td>**your text**</td><td class="arrow">&rarr;</td><td><strong>your text</strong></td></tr>
  <tr><td>`my code`</td><td class="arrow">&rarr;</td><td><code>my code</code></td></tr>
  <tr><td>* Bulleted list<br />* Second item</td><td class="arrow">&rarr;</td><td>&#8226; Bulleted list<br />&#8226; Second item</td></tr>
  <tr><td>1. Numbered list<br />1. Second item</td><td class="arrow">&rarr;</td><td>1. Numbered list<br />2. Second item</td></tr>
  <tr><td>[link name](URL)</td><td class="arrow">&rarr;</td><td><a href="URL">link name</a></td></tr>
  <tr><td>***</td><td class="arrow">&rarr;</td><td>Horizontal ruler</td></tr>
  <tr><td>&lt;http://url><br />&lt;email@add.com></td><td class="arrow">&rarr;</td><td>Auto-linked</td></tr>
  <tr><td>![Alt text](URL)</td><td class="arrow">&rarr;</td><td>Image</td></tr>
 </table>
 <p>For a complete list of LaTeX commands supported here, see the <a href="http://golem.ph.utexas.edu/~distler/blog/itex2MMLcommands.html">itex2MML Commands Summary</a>.</p>
--- a/app/views/textile_help.rhtml
+++ b/app/views/textile_help.rhtml
@ -1,4 +1,4 @@
-<h3>Textile formatting tips (<a href="http://hobix.com/textile/quick.html" onClick="quickRedReference(); return false;">advanced</a>)</h3>
+<h3>Textile formatting tips (<a href="http://hobix.com/textile/quick.html" onclick="quickRedReference(); return false;">advanced</a>)</h3>
 <table cellspacing="0" cellpadding="0">
  <tr><td>_your text_</td><td class="arrow">&rarr;</td><td><em>your text</em></td></tr>
  <tr><td>*your text*</td><td class="arrow">&rarr;</td><td><strong>your text</strong></td></tr>
--- a/app/views/wiki/edit.rhtml
+++ b/app/views/wiki/edit.rhtml
@ -11,7 +11,7 @@
 <div id="editForm">
 	<%= form_tag({ :action => 'save', :web => @web.address, :id => @page.name },
-	             { 'id' => 'editForm', 'method' => 'post', 'onSubmit' => 'cleanAuthorName()',
+	             { 'id' => 'editForm', 'method' => 'post', 'onsubmit' => 'cleanAuthorName()',
 	               'accept-charset' => 'utf-8' }) %>
 		<textarea name="content" id="content"><%= h(@flash[:content] || @page.content) %></textarea>
--- a/app/views/wiki/new.rhtml
+++ b/app/views/wiki/new.rhtml
@ -11,7 +11,7 @@
 <div id="editForm">
 	<%= form_tag({ :action => 'save', :web => @web.address, :id => @page_name },
-	        { 'id' => 'editForm', 'method' => 'post', 'onSubmit' => 'cleanAuthorName();', 'accept-charset' => 'utf-8' }) %>
+	        { 'id' => 'editForm', 'method' => 'post', 'onsubmit' => 'cleanAuthorName();', 'accept-charset' => 'utf-8' }) %>
 	    <textarea name="content" id="content"><%= h(@flash[:content] || '') %></textarea>
 		<div id="editFormButtons">
--- a/app/views/wiki/page.rhtml
+++ b/app/views/wiki/page.rhtml
@ -37,7 +37,7 @@
    <%= link_to('Print',
            { :web => @web.address, :action => 'print', :id => @page.name },
            { :accesskey => 'p', :name => 'view_print' }) %>
-  <% if defined? RedClothForTex and RedClothForTex.available? and @web.markup == :textile %>
+  <% if defined? RedClothForTex and RedClothForTex.available? and @web.markup == :textile or @web.markup == :markdownMML %>
    | 
    <%= link_to 'TeX', {:web => @web.address, :action => 'tex', :id => @page.name}, 
            {:name => 'view_tex'} %>
--- a/app/views/wiki/rollback.rhtml
+++ b/app/views/wiki/rollback.rhtml
@ -13,13 +13,13 @@
 <div id="editForm">
 	<%= form_tag({:web => @web.address, :action => 'save', :id => @page.name},
-	      { :id => 'editForm', :method => 'post', :onSubmit => 'cleanAuthorName();', 
+	      { :id => 'editForm', :method => 'post', :onsubmit => 'cleanAuthorName();', 
 	        'accept-charset' => 'utf-8' }) %>
        <textarea name="content" id="content"><%= @revision.content %></textarea>
 		<div id="editFormButtons">
 	        <input type="submit" value="Update" accesskey="u" /> as 
 		    <input type="text" name="author" id="authorName" value="<%= @author %>" 
-		        onClick="this.value == 'AnonymousCoward' ? this.value = '' : true" />
+		        onclick="this.value == 'AnonymousCoward' ? this.value = '' : true" />
 		    | 
 			<span>
 				<%= link_to('Cancel', {:web => @web.address, :action => 'cancel_edit', :id => @page.name},
--- a/app/views/wiki/tex.rhtml
+++ b/app/views/wiki/tex.rhtml
@ -1,12 +1,12 @@
 \documentclass[12pt,titlepage]{article}
-\usepackage[danish]{babel}      %danske tekster
+\usepackage{amsmath}
 \usepackage{amsfonts}
 \usepackage[OT1]{fontenc}       %rigtige danske bogstaver...
 \usepackage{a4}
 \usepackage{graphicx}
 \usepackage{ucs}
 \usepackage[utf8x]{inputenc}
-\input epsf 
+\usepackage{hyperref}
 %-------------------------------------------------------------------
--- a/db/production.db.sqlite3
+++ b/db/production.db.sqlite3
--- a/db/schema.rb
+++ b/db/schema.rb
@ -0,0 +1,78 @@
 # This file is autogenerated. Instead of editing this file, please use the
 # migrations feature of ActiveRecord to incrementally modify your database, and
 # then regenerate this schema definition.
 ActiveRecord::Schema.define(:version => 2) do
  create_table "pages", :force => true do |t|
    t.column "created_at", :datetime, :null => false
    t.column "updated_at", :datetime, :null => false
    t.column "web_id", :integer, :default => 0, :null => false
    t.column "locked_by", :string, :limit => 60
    t.column "name", :string, :limit => 60
    t.column "locked_at", :datetime
  end
  create_table "revisions", :force => true do |t|
    t.column "created_at", :datetime, :null => false
    t.column "updated_at", :datetime, :null => false
    t.column "revised_at", :datetime, :null => false
    t.column "page_id", :integer, :default => 0, :null => false
    t.column "content", :text, :default => "", :null => false
    t.column "author", :string, :limit => 60
    t.column "ip", :string, :limit => 60
  end
  add_index "revisions", ["author"], :name => "revisions_author_index"
  add_index "revisions", ["created_at"], :name => "revisions_created_at_index"
  add_index "revisions", ["page_id"], :name => "revisions_page_id_index"
  create_table "sessions", :force => true do |t|
    t.column "session_id", :string
    t.column "data", :text
    t.column "updated_at", :datetime
  end
  add_index "sessions", ["session_id"], :name => "sessions_session_id_index"
  create_table "system", :force => true do |t|
    t.column "password", :string, :limit => 60
  end
  create_table "webs", :force => true do |t|
    t.column "created_at", :datetime, :null => false
    t.column "updated_at", :datetime, :null => false
    t.column "name", :string, :limit => 60, :default => "", :null => false
    t.column "address", :string, :limit => 60, :default => "", :null => false
    t.column "password", :string, :limit => 60
    t.column "additional_style", :string
    t.column "allow_uploads", :integer, :default => 1
    t.column "published", :integer, :default => 0
    t.column "count_pages", :integer, :default => 0
    t.column "markup", :string, :limit => 50, :default => "textile"
    t.column "color", :string, :limit => 6, :default => "008B26"
    t.column "max_upload_size", :integer, :default => 100
    t.column "safe_mode", :integer, :default => 0
    t.column "brackets_only", :integer, :default => 0
  end
  create_table "wiki_files", :force => true do |t|
    t.column "created_at", :datetime, :null => false
    t.column "updated_at", :datetime, :null => false
    t.column "web_id", :integer, :null => false
    t.column "file_name", :string, :null => false
    t.column "description", :string, :null => false
  end
  create_table "wiki_references", :force => true do |t|
    t.column "created_at", :datetime, :null => false
    t.column "updated_at", :datetime, :null => false
    t.column "page_id", :integer, :default => 0, :null => false
    t.column "referenced_name", :string, :limit => 60, :default => "", :null => false
    t.column "link_type", :string, :limit => 1, :default => "", :null => false
  end
  add_index "wiki_references", ["referenced_name"], :name => "wiki_references_referenced_name_index"
  add_index "wiki_references", ["page_id"], :name => "wiki_references_page_id_index"
 end
--- a/9
+++ b/9
@ -1,7 +1,6 @@
-#!/bin/sh
+#!/usr/bin/env ruby
-cd $(dirname $0)
+# Executable file for a gem
-
+# must be same as ./instiki.rb
 export LD_LIBRARY_PATH=./lib/native/linux-x86:$LD_LIBRARY_PATH
 ruby script/server
 load File.dirname(__FILE__) + '/script/server'
--- a/lib/bluecloth_tweaked.rb
+++ b/lib/bluecloth_tweaked.rb
@ -1112,7 +1112,7 @@ class BlueCloth < String
 	### Return a copy of +str+ with angle brackets and ampersands HTML-encoded.
 	def encode_html( str )
-		str.gsub( /&(?!#?[x]?(?:[0-9a-f]+|\w{1,8});)/i, "&amp;" ).
+		str.gsub( /&(?!#?[x]?(?:[0-9a-f]+|\w+);)/i, "&amp;" ).
 			gsub( %r{<(?![a-z/?\$!])}i, "&lt;" )
 	end
--- a/lib/chunks/engines.rb
+++ b/lib/chunks/engines.rb
@ -40,6 +40,14 @@ module Engines
    end
  end
  class MarkdownMML < AbstractEngine
    def mask
      require_dependency 'maruku'
      require_dependency 'maruku/ext/math'
      Maruku.new(@content.delete("\r")).to_html
    end
  end
  class Mixed < AbstractEngine
    def mask
      require_dependency 'redcloth'
@ -57,6 +65,6 @@ module Engines
    end
  end
-  MAP = { :textile => Textile, :markdown => Markdown, :mixed => Mixed, :rdoc => RDoc }
+  MAP = { :textile => Textile, :markdown => Markdown, :markdownMML => MarkdownMML, :mixed => Mixed, :rdoc => RDoc }
  MAP.default = Textile
 end
--- a/lib/maruku.rb
+++ b/lib/maruku.rb
@ -0,0 +1,133 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 require 'rexml/document'
 # :include:MaRuKu.txt
 module MaRuKu
 	module In
 		module Markdown
 			module SpanLevelParser; end
 			module BlockLevelParser; end
 		end
 		# more to come?
 	end
 	module Out
 		# Functions for exporting to MarkDown.
 		module Markdown; end
 		# Functions for exporting to HTML.
 		module HTML; end
 		# Functions for exporting to Latex
 		module Latex; end
 	end
 	# These are strings utilities.
 	module Strings; end
 	module Helpers; end
 	module Errors; end
 	class MDElement
 		include REXML
 		include MaRuKu
 		include Out::Markdown
 		include Out::HTML
 		include Out::Latex
 		include Strings
 		include Helpers
 		include Errors
 	end
 	class MDDocument < MDElement
 		include In::Markdown
 		include In::Markdown::SpanLevelParser
 		include In::Markdown::BlockLevelParser
 	end
 end
 # This is the public interface
 class Maruku < MaRuKu::MDDocument; end
 require 'rexml/document'
 # Structures definition
 require 'maruku/structures'
 require 'maruku/structures_inspect'
 require 'maruku/defaults'
 # Less typing
 require 'maruku/helpers'
 # Code for parsing whole Markdown documents
 require 'maruku/input/parse_doc'
 # Ugly things kept in a closet
 require 'maruku/string_utils'
 require 'maruku/input/linesource'
 require 'maruku/input/type_detection'
 # A class for reading and sanitizing inline HTML
 require 'maruku/input/html_helper'
 # Code for parsing Markdown block-level elements
 require 'maruku/input/parse_block'
 # Code for parsing Markdown span-level elements
 require 'maruku/input/charsource'
 require 'maruku/input/parse_span_better'
 require 'maruku/input/rubypants'
 require 'maruku/input/extensions'
 require 'maruku/attributes'
 require 'maruku/structures_iterators'
 require 'maruku/errors_management'
 # Code for creating a table of contents
 require 'maruku/toc'
 # Version and URL
 require 'maruku/version'
 # Exporting to html
 require 'maruku/output/to_html'
 # Exporting to latex
 require 'maruku/output/to_latex'
 require 'maruku/output/to_latex_strings'
 require 'maruku/output/to_latex_entities'
 # Pretty print
 require 'maruku/output/to_markdown'
 # Exporting to text: strips all formatting (not complete)
 require 'maruku/output/to_s'
 # class Maruku is the global interface
 require 'maruku/maruku'
--- a/lib/maruku/attic/parse_span.rb.txt
+++ b/lib/maruku/attic/parse_span.rb.txt
@ -0,0 +1,462 @@
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #  NOTE: this is the old span-level regexp-based parser.
 #
 #  The new parser is a real parser and is defined with functions in parse_span_better.rb
 #  The new parser is faster, handles syntax errors, but it's absolutely not readable.
 #
 #  Also, regexp parsers simply CANNOT handle inline HTML properly.
 # There are two black-magic methods `match_couple_of` and `map_match`,
 # defined at the end of the file, that make the function 
 # `parse_lines_as_span` so elegant.
 class Maruku
 	# Takes care of all span-level formatting, links, images, etc.
 	#
 	# Lines must not contain block-level elements.
 	def parse_lines_as_span(lines)
 		# first, get rid of linebreaks
 		res = resolve_linebreaks(lines)
 		span = MDElement.new(:dummy, res)
 		# encode all escapes
 		span.replace_each_string { |s| s.escape_md_special }
 # The order of processing is significant: 
 # 1. inline code
 # 2. immediate links
 # 3. inline HTML 
 # 4. everything else
 		# search for ``code`` markers
 		span.match_couple_of('``') { |children, match1, match2| 
 			e = create_md_element(:inline_code)
 			# this is now opaque to processing
 			e.meta[:raw_code] = children.join('').it_was_a_code_block
 			e
 		}
 		# Search for `single tick`  code markers
 		span.match_couple_of('`') { |children, match1, match2|
 			e = create_md_element(:inline_code)
 			# this is now opaque to processing
 			e.meta[:raw_code] = children.join('').it_was_a_code_block
 			# this is now opaque to processing
 			e
 		}
 		# Detect any immediate link: <http://www.google.com>
 		# we expect an http: or something: at the beginning
 		span.map_match( /<(\w+:[^\>]+)>/) { |match| 
 			url = match[1]
 			e = create_md_element(:immediate_link, [])
 			e.meta[:url] = url
 			e
 		}
 		# Search for inline HTML (the support is pretty basic for now)
 		# this searches for a matching block
 		inlineHTML1 = %r{
 			(   # put everything in 1 
 			<   # open
 			(\w+) # opening tag in 2
 			>   # close
 			.*  # anything
 			</\2> # match closing tag
 			)
 		}x
 		# this searches for only one block
 		inlineHTML2 = %r{
 			(   # put everything in 1 
 			<   # open
 			\w+ # 
 			    # close
 			[^<>]*  # anything except
 			/> # closing tag
 			)
 		}x
 		for reg in [inlineHTML1, inlineHTML2]
 			span.map_match(reg) { |match| 
 				raw_html = match[1]
 				convert_raw_html_in_list(raw_html)
 			}
 		end
 		# Detect footnotes references: [^1]
 		span.map_match(/\[(\^[^\]]+)\]/) { |match| 
 			id = match[1].strip.downcase
 			e = create_md_element(:footnote_reference)
 			e.meta[:footnote_id] = id
 			e
 		}
 		# Detect any image like ![Alt text][url]
 		span.map_match(/\!\[([^\]]+)\]\s?\[([^\]]*)\]/) { |match|
 			alt = match[1]
 			id = match[2].strip.downcase
 			if id.size == 0
 				id = text.strip.downcase
 			end
 			e = create_md_element(:image)
 			e.meta[:ref_id] = id
 			e
 		}
 		# Detect any immage with immediate url: ![Alt](url "title")
 		# a dummy ref is created and put in the symbol table
 		link1 = /!\[([^\]]+)\]\s?\(([^\s\)]*)(?:\s+["'](.*)["'])?\)/
 		span.map_match(link1) { |match|
 			alt = match[1]
 			url = match[2]
 			title = match[3]
 			url = url.strip
 			# create a dummy id
 			id="dummy_#{@refs.size}"
 			@refs[id] = {:url=>url, :title=>title}
 			e = create_md_element(:image)
 			e.meta[:ref_id] = id
 			e
 		}
 		# an id reference: "[id]",  "[ id  ]"
 		reg_id_ref = %r{
 			\[ # opening bracket 
 			([^\]]*) # 0 or more non-closing bracket (this is too permissive)
 			\] # closing bracket
 			}x
 		# validates a url, only $1 is set to the url
 		reg_url = 
 			/((?:\w+):\/\/(?:\w+:{0,1}\w*@)?(?:\S+)(?::[0-9]+)?(?:\/|\/([\w#!:.?+=&%@!\-\/]))?)/
 		reg_url = %r{([^\s\]\)]+)}
 		# A string enclosed in quotes.
 		reg_title = %r{
 			" # opening
 			[^"]*   # anything = 1
 			" # closing
 			}x
 		# [bah](http://www.google.com "Google.com"), 
 		# [bah](http://www.google.com),
 		# [empty]()
 		reg_url_and_title = %r{
 			\(  # opening
 			\s* # whitespace 
 			#{reg_url}?  # url = 1 might be  empty
 			(?:\s+["'](.*)["'])? # optional title  = 2
 			\s* # whitespace 
 			\) # closing
 		}x
 		# Detect a link like ![Alt text][id]
 		span.map_match(/\[([^\]]+)\]\s?\[([^\]]*)\]/) { |match|
 			text = match[1]
 			id = match[2].strip.downcase
 			if id.size == 0
 				id = text.strip.downcase
 			end
 			children = parse_lines_as_span(text)
 			e = create_md_element(:link, children)
 			e.meta[:ref_id] = id
 			e
 		}
 		# Detect any immage with immediate url: ![Alt](url "title")
 		# a dummy ref is created and put in the symbol table
 		link1 = /!\[([^\]]+)\]\s?\(([^\s\)]*)(?:\s+["'](.*)["'])?\)/
 		span.map_match(link1) { |match|
 			text = match[1]
 			children = parse_lines_as_span(text)
 			url = match[2]
 			title = match[3]
 			url = url.strip
 			# create a dummy id
 			id="dummy_#{@refs.size}"
 			@refs[id] = {:url=>url, :title=>title}
 			@refs[id][:title] = title if title
 			e = create_md_element(:link, children)
 			e.meta[:ref_id] = id
 			e
 		}
 		# Detect any link like [Google engine][google]
 		span.match_couple_of('[',  # opening bracket
 			%r{\]                   # closing bracket
 			[ ]?                    # optional whitespace
 			#{reg_id_ref} # ref id, with $1 being the reference 
 			}x
 				) { |children, match1, match2| 
 			id = match2[1]
 			id = id.strip.downcase
 			if id.size == 0
 				id = children.join.strip.downcase
 			end
 			e = create_md_element(:link, children)
 			e.meta[:ref_id] = id
 			e
 		}
 		# Detect any link with immediate url: [Google](http://www.google.com)
 		# XXX Note that the url can be empty: [Empty]()
 		# a dummy ref is created and put in the symbol table
 		span.match_couple_of('[',  # opening bracket
 				%r{\]                   # closing bracket
 				[ ]?                    # optional whitespace
 				#{reg_url_and_title}    # ref id, with $1 being the url and $2 being the title
 				}x
 					) { |children, match1, match2| 
 			url   = match2[1]
 			title = match2[3] # XXX? Is it a bug? I would use [2]
 			# create a dummy id
 			id="dummy_#{@refs.size}"
 			@refs[id] = {:url=>url}
 			@refs[id][:title] = title if title
 			e = create_md_element(:link, children)
 			e.meta[:ref_id] = id
 			e
 		}
 		# Detect an email address <andrea@invalid.it>
 		span.map_match(EMailAddress) { |match| 
 			email = match[1]
 			e = create_md_element(:email_address, [])
 			e.meta[:email] = email
 			e
 		}
 		# Detect HTML entitis
 		span.map_match(/&([\w\d]+);/) { |match| 
 			entity_name = match[1]
 			e = create_md_element(:entity, [])
 			e.meta[:entity_name] = entity_name
 			e
 		}
 		# And now the easy stuff
 		# search for ***strong and em***
 		span.match_couple_of('***') { |children,m1,m2|  
 			create_md_element(:strong, [create_md_element(:emphasis, children)] ) }
 		span.match_couple_of('___') { |children,m1,m2|  
 			create_md_element(:strong, [create_md_element(:emphasis, children)] ) }
 		# search for **strong**
 		span.match_couple_of('**') { |children,m1,m2|  create_md_element(:strong,   children) }
 		# search for __strong__
 		span.match_couple_of('__') { |children,m1,m2|  create_md_element(:strong,   children) }
 		# search for *emphasis*
 		span.match_couple_of('*')  { |children,m1,m2|  create_md_element(:emphasis, children) }
 		# search for _emphasis_
 		span.match_couple_of('_')  { |children,m1,m2|  create_md_element(:emphasis, children) }
 		# finally, unescape the special characters
 		span.replace_each_string { |s|  s.unescape_md_special}
 		span.children
 	end
 	# returns array containing Strings or :linebreak elements
 	def resolve_linebreaks(lines)
 		res = []
 		s = ""
 		lines.each do |l| 
 			s += (s.size>0 ? " " : "") + l.strip
 			if force_linebreak?(l)
 				res << s
 				res << create_md_element(:linebreak)
 				s = ""
 			end
 		end
 		res << s if s.size > 0
 		res
 	end
 	# raw_html is something like 
 	#  <em> A</em> dopwkk *maruk* <em>A</em>  
 	def convert_raw_html_in_list(raw_html)
 		e = create_md_element(:raw_html)
 		e.meta[:raw_html]  = raw_html
 		begin
 			e.meta[:parsed_html] = Document.new(raw_html)
 		rescue 
 			$stderr.puts "convert_raw_html_in_list Malformed HTML:\n#{raw_html}"
 		end
 		e
 	end
 end
 # And now the black magic that makes the part above so elegant
 class MDElement	
 	# Try to match the regexp to each string in the hierarchy
 	# (using `replace_each_string`). If the regexp match, eliminate
 	# the matching string and substitute it with the pre_match, the
 	# result of the block, and the post_match
 	#
 	#   ..., matched_string, ... -> ..., pre_match, block.call(match), post_match
 	#
 	# the block might return arrays.
 	#
 	def map_match(regexp, &block)
 		replace_each_string { |s| 
 			processed = []
 			while (match = regexp.match(s))
 				# save the pre_match
 				processed << match.pre_match if match.pre_match && match.pre_match.size>0
 				# transform match
 				result = block.call(match)
 				# and append as processed
 				[*result].each do |e| processed << e end
 				# go on with the rest of the string
 				s = match.post_match 
 			end
 			processed << s if s.size > 0
 			processed
 		}
 	end
 	# Finds couple of delimiters in a hierarchy of Strings and MDElements
 	#
 	# Open and close are two delimiters (like '[' and ']'), or two Regexp.
 	#
 	# If you don't pass close, it defaults to open.
 	#
 	# Each block is called with |contained children, match1, match2|
 	def match_couple_of(open, close=nil, &block)
 		close = close || open
 		 open_regexp =  open.kind_of?(Regexp) ?  open : Regexp.new(Regexp.escape(open))
 		close_regexp = close.kind_of?(Regexp) ? close : Regexp.new(Regexp.escape(close))
 		# Do the same to children first
 		for c in @children; if c.kind_of? MDElement
 			c.match_couple_of(open_regexp, close_regexp, &block)
 		end end
 		processed_children = []
 		until @children.empty?
 			c = @children.shift
 			if c.kind_of? String
 				match1 = open_regexp.match(c)
 				if not match1
 					processed_children << c
 				else # we found opening, now search closing
 #					puts "Found opening (#{marker}) in #{c.inspect}"
 					# pre match is processed
 					processed_children.push match1.pre_match if 
 						match1.pre_match && match1.pre_match.size > 0
 					# we will process again the post_match
 					@children.unshift match1.post_match if 
 						match1.post_match && match1.post_match.size>0
 					contained = []; found_closing = false
 					until @children.empty?  || found_closing
 						c = @children.shift
 						if c.kind_of? String
 							match2 = close_regexp.match(c)
 							if not match2 
 								contained << c
 							else
 								# we found closing
 								found_closing = true
 								# pre match is contained
 								contained.push match2.pre_match if 
 									match2.pre_match && match2.pre_match.size>0
 								# we will process again the post_match
 								@children.unshift match2.post_match if 
 									match2.post_match && match2.post_match.size>0
 								# And now we call the block
 								substitute = block.call(contained, match1, match2) 
 								processed_children  << substitute
 #								puts "Found closing (#{marker}) in #{c.inspect}"
 #								puts "Children: #{contained.inspect}"
 #								puts "Substitute: #{substitute.inspect}"
 							end
 						else
 							contained << c
 						end
 					end
 					if not found_closing
 						# $stderr.puts "##### Could not find closing for #{open}, #{close} -- ignoring"
 						processed_children << match1.to_s
 						contained.reverse.each do |c|
 							@children.unshift c
 						end
 					end
 				end
 			else
 				processed_children << c
 			end
 		end
 		raise "BugBug" unless @children.empty?
 		rebuilt = []
 		# rebuild strings
 		processed_children.each do |c|
 			if c.kind_of?(String) && rebuilt.last && rebuilt.last.kind_of?(String)
 				rebuilt.last << c
 			else
 				rebuilt << c
 			end
 		end
 		@children = rebuilt
 	end
 end
--- a/lib/maruku/attributes.rb
+++ b/lib/maruku/attributes.rb
@ -0,0 +1,218 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 class String
 	def quote_if_needed
 		if /[\s\'\"]/.match self
 			inspect
 		else
 			self
 		end
 	end
 end
 module MaRuKu; 
 	MagicChar = ':'
 	class AttributeList < Array
 		# An attribute list becomes 
 		# {#id .cl key="val" ref}
 		# [ [:id, 'id'], [:class, 'id'], ['key', 'val'], [ :ref, 'ref' ]]
 		private :push
 		def push_key_val(key, val); 
 			raise "Bad #{key.inspect}=#{val.inspect}" if not key and val
 			push [key, val] 
 		end
 		def push_ref(ref_id);       
 			raise "Bad :ref #{ref_id.inspect}" if not ref_id
 			push [:ref, ref_id] 
 		end
 		def push_class(val);        
 			raise "Bad :id #{val.inspect}" if not val
 			push [:class,  val] 
 		end
 		def push_id(val);           
 			raise "Bad :id #{val.inspect}" if not val
 			push [:id,  val] 
 		end
 		def to_s
 			map do |k,v|
 				case k
 				when :id;    "#" + v.quote_if_needed
 				when :class; "." + v.quote_if_needed
 				when :ref;    v.quote_if_needed
 				else k.quote_if_needed + "=" + v.quote_if_needed
 				end
 			end . join(' ')
 		end
 		alias to_md to_s 
 	end
 end
 module MaRuKu; module In; module Markdown; module SpanLevelParser
 	def unit_tests_for_attribute_lists
 		[
 			[ "",     [], "Empty lists are allowed" ], 
 			[ "=",    :throw, "Bad char to begin a list with." ], 
 			[ "a =b", :throw, "No whitespace before `=`." ], 
 			[ "a= b", :throw, "No whitespace after `=`." ], 
 			[ "a b c", [[:ref, 'a'],[:ref, 'b'],[:ref, 'c']], "More than one ref" ], 
 			[ "hello notfound", [[:ref, 'hello'],[:ref, 'notfound']]], 
 			[ "'a'",  [[:ref, 'a']], "Quoted value." ], 
 			[ '"a"'   ], 
 			[ "a=b",  [['a','b']], "Simple key/val" ], 
 			[ "'a'=b"   ], 
 			[ "'a'='b'" ], 
 			[ "a='b'"   ], 
 			[ 'a="b\'"',  [['a',"b\'"]], "Key/val with quotes" ],
 			[ 'a=b\''],
 			[ 'a="\\\'b\'"',  [['a',"\'b\'"]], "Key/val with quotes" ], 
 			['"', :throw, "Unclosed quotes"],
 			["'"],
 			["'a "],
 			['"a '],
 			[ "#a",  [[:id, 'a']], "Simple ID" ], 
 			[ "#'a'" ], 
 			[ '#"a"' ], 
 			[ "#",  :throw, "Unfinished '#'." ], 
 			[ ".",  :throw, "Unfinished '.'." ], 
 			[ "# a",  :throw, "No white-space after '#'." ], 
 			[ ". a",  :throw, "No white-space after '.' ." ], 
 			[ "a=b c=d",  [['a','b'],['c','d']], "Tabbing" ], 
 			[ " \ta=b \tc='d' "],
 			[ "\t a=b\t c='d'\t\t"],
 			[ ".\"a'",  :throw, "Mixing quotes is bad." ], 
 		].map { |s, expected, comment| 
 			@expected = (expected ||= @expected)
 			@comment  = (comment  ||= (last=@comment) )
 			(comment == last && (comment += (@count+=1).to_s)) || @count = 1
 			expected = [md_ial(expected)] if expected.kind_of? Array
 			["{#{MagicChar}#{s}}", expected, "Attributes: #{comment}"]
 		}
 	end
 	def md_al(s=[]); AttributeList.new(s) end
 	# returns nil or an AttributeList
 	def read_attribute_list(src, con, break_on_chars)
 		separators = break_on_chars + [?=,?\ ,?\t]
 		escaped = Maruku::EscapedCharInQuotes
 		al = AttributeList.new
 		while true
 			src.consume_whitespace
 			break if break_on_chars.include? src.cur_char
 			case src.cur_char
 			when nil 
 				maruku_error "Attribute list terminated by EOF:\n "+
 				             "#{al.inspect}" , src, con
 				tell_user "I try to continue and return partial attribute list:\n"+
 					al.inspect
 				break
 			when ?=     # error
 				maruku_error "In attribute lists, cannot start identifier with `=`."
 				tell_user "I try to continue"
 				src.ignore_char
 			when ?#     # id definition
 				src.ignore_char
 				if id = read_quoted_or_unquoted(src, con, escaped, separators)
 					al.push_id id
 				else
 					maruku_error 'Could not read `id` attribute.', src, con
 					tell_user 'Trying to ignore bad `id` attribute.'
 				end
 			when ?.     # class definition
 				src.ignore_char
 				if klass = read_quoted_or_unquoted(src, con, escaped, separators)
 					al.push_class klass
 				else
 					maruku_error 'Could not read `class` attribute.', src, con
 					tell_user 'Trying to ignore bad `class` attribute.'
 				end
 			else
 				if key = read_quoted_or_unquoted(src, con, escaped, separators)
 					if src.cur_char == ?=
 						src.ignore_char # skip the =
 						if val = read_quoted_or_unquoted(src, con, escaped, separators)
 							al.push_key_val(key, val)
 						else
 							maruku_error "Could not read value for key #{key.inspect}.",
 								src, con
 							tell_user "Ignoring key #{key.inspect}."
 						end
 					else
 						al.push_ref key
 					end
 				else
 					maruku_error 'Could not read key or reference.'
 				end
 			end # case
 		end # while true
 		al
 	end
 	def merge_ial(elements, src, con)	
 		# We need a helper
 		def is_ial(e); e.kind_of? MDElement and e.node_type == :ial end
 		# Apply each IAL to the element before
 		elements.each_with_index do |e, i| 
 		if is_ial(e) && i>= 1 then
 			before = elements[i-1]
 			after = elements[i+1]
 			if before.kind_of? MDElement
 				before.al = e.ial
 			elsif after.kind_of? MDElement
 				after.al = e.ial
 			else
 				maruku_error "I don't know who you are referring to:"+
 					" {#{e.ial.to_md}}", src, con
 				# xxx dire se c'è empty vicino
 				maruku_recover "Ignoring IAL: {#{e.ial.to_md}}", src, con
 			end
 		end 
 		end
 		if not Globals[:debug_keep_ials]
 			elements.delete_if {|x| is_ial(x) unless x == elements.first} 
 		end
 	end
 end end end end 
 #module MaRuKu; module In; module Markdown; module SpanLevelParser
--- a/lib/maruku/defaults.rb
+++ b/lib/maruku/defaults.rb
@ -0,0 +1,52 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 module MaRuKu
 Globals = {
 	:unsafe_features => false,
 	:debug_keep_ials => false,
 	:maruku_signature => false,
 	:code_background_color => '#fef',
 	:code_show_spaces => false,
 	:html_math_engine => 'itex2mml', #ritex, itex2mml, none
 	:html_use_syntax => false,
 	:on_error => :warning
 }
 class MDElement
 	def get_setting(sym)
 		if self.attributes.has_key?(sym) then
 			return self.attributes[sym]
 		elsif self.doc && self.doc.attributes.has_key?(sym) then
 			return self.doc.attributes[sym]
 		elsif MaRuKu::Globals.has_key?(sym)
 			return MaRuKu::Globals[sym]
 		else
 			$stderr.puts "Bug: no default for #{sym.inspect}"
 			nil
 		end
 	end
 end
 end
--- a/lib/maruku/errors_management.rb
+++ b/lib/maruku/errors_management.rb
@ -0,0 +1,92 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 #m  Any method that detects formatting error calls the
 #m  maruku_error() method. 
 #m  if @meta[:on_error] == 
 #m
 #m  - :warning   write on the standard err (or @error_stream if defined), 
 #m              then do your best.
 #m  - :ignore    be shy and try to continue
 #m  - :raise     raises a MarukuException
 #m
 #m  default is :raise
 module MaRuKu
 	class Exception < RuntimeError
 	end
 module Errors
 	def maruku_error(s,src=nil,con=nil)
 		policy = get_setting(:on_error)
 		case policy
 		when :ignore 
 		when :raise
 			raise_error create_frame(describe_error(s,src,con))
 		when :warning
 			tell_user create_frame(describe_error(s,src,con))
 		else
 			raise "BugBug: policy = #{policy.inspect}"
 		end
 	end
 	def maruku_recover(s,src=nil,con=nil)
 		tell_user create_frame(describe_error(s,src,con))
 	end
 	alias error maruku_error
 	def raise_error(s)
 		raise MaRuKu::Exception, s, caller
 	end
 	def tell_user(s)
 		error_stream = self.attributes[:error_stream] || $stderr
 		error_stream << s 
 	end
 	def create_frame(s)
 		n = 75
 		"\n" +
 		" "+"_"*n << "\n"<<
 		"| Maruku tells you:\n" << 
 		"+"+"-"*n +"\n"+
 		add_tabs(s,1,'| ') << "\n" <<
 		"+" << "-"*n << "\n" <<
 		add_tabs(caller[0, 5].join("\n"),1,'!') << "\n" <<
 		"\\" << "_"*n << "\n"
 	end
 	def describe_error(s,src,con)
 		t = s
 		src && (t += "\n#{src.describe}\n")
 		con && (t += "\n#{con.describe}\n")
 		t
 	end
 end # Errors
 end # MaRuKu
--- a/lib/maruku/ext/math.rb
+++ b/lib/maruku/ext/math.rb
@ -0,0 +1,10 @@
 require 'maruku/ext/math/elements'
 require 'maruku/ext/math/parsing'
 require 'maruku/ext/math/to_latex'
 require 'maruku/ext/math/to_html'
 require 'maruku/ext/math/mathml_engines/none'
 require 'maruku/ext/math/mathml_engines/ritex'
 require 'maruku/ext/math/mathml_engines/itex2mml'
--- a/lib/maruku/ext/math/elements.rb
+++ b/lib/maruku/ext/math/elements.rb
@ -0,0 +1,26 @@
 module MaRuKu; class MDElement
 	def md_inline_math(math)
 		self.md_el(:inline_math, [], meta={:math=>math})
 	end
 	def md_equation(math, label=nil)
 		reglabel= /\\label\{(\w+)\}/
 		if math =~ reglabel
 			label = $1
 			math.gsub!(reglabel,'')
 		end
 #		puts "Found label = #{label} math #{math.inspect} "
 		num = nil
 		if label && @doc #take number
 			@doc.eqid2eq ||= {}	
 			num = @doc.eqid2eq.size + 1
 		end
 		e = self.md_el(:equation, [], meta={:math=>math, :label=>label,:num=>num})
 		if label && @doc #take number
 			@doc.eqid2eq[label] = e
 		end
 		e
 	end
 end end
--- a/lib/maruku/ext/math/mathml_engines/itex2mml.rb
+++ b/lib/maruku/ext/math/mathml_engines/itex2mml.rb
@ -0,0 +1,35 @@
 module MaRuKu; module Out; module HTML
 	def convert_to_mathml_itex2mml(tex, method)
 		begin
 			if not $itex2mml_parser
 				require 'itextomml'
 				$itex2mml_parser =  Itex2MML::Parser.new
 			end
 			mathml =  $itex2mml_parser.send(method, tex)
 			doc = Document.new(mathml, {:respect_whitespace =>:all}).root
 			return doc
 		rescue LoadError => e
 			maruku_error "Could not load package 'itex2mml'.\n"+
 			"Please install it."
 		rescue REXML::ParseException => e
 			maruku_error "Invalid MathML TeX: \n#{add_tabs(tex,1,'tex>')}"+
 				"\n\n #{e.inspect}"
 		rescue 
 			maruku_error "Could not produce MathML TeX: \n#{tex}"+
 				"\n\n #{e.inspect}"
 		end
 		nil
 	end
 	def to_html_inline_math_itex2mml
 		convert_to_mathml_itex2mml(self.math, :inline_filter) 
 	end
 	def to_html_equation_itex2mml
 		convert_to_mathml_itex2mml(self.math, :block_filter)
 	end
 end end end
--- a/lib/maruku/ext/math/mathml_engines/none.rb
+++ b/lib/maruku/ext/math/mathml_engines/none.rb
@ -0,0 +1,20 @@
 module MaRuKu; module Out; module HTML
 	def to_html_inline_math_none
 		# You can: either return a REXML::Element
 		#    return Element.new 'div'    
 		# or return an empty array on error
 		#    return []  
 		# or have a string parsed by REXML:
 		tex = self.math
 		tex.gsub!('&','&amp;')
 		mathml = "<code>#{tex}</code>"
 		return Document.new(mathml).root
 	end
 	def to_html_equation_none
 		return to_html_inline_math_none
 	end
 end end end
--- a/lib/maruku/ext/math/mathml_engines/ritex.rb
+++ b/lib/maruku/ext/math/mathml_engines/ritex.rb
@ -0,0 +1,34 @@
 module MaRuKu; module Out; module HTML
 	def convert_to_mathml_ritex(tex)
 		begin
 			if not $ritex_parser
 				require 'ritex'
 			 	$ritex_parser = Ritex::Parser.new
 			end
 			mathml =  $ritex_parser.parse(tex.strip)
 			doc = Document.new(mathml, {:respect_whitespace =>:all}).root
 			return doc
 		rescue LoadError => e
 			maruku_error "Could not load package 'ritex'.\n"+
 			"Please install it using:\n"+
 			"   $ gem install ritex\n\n"+e.inspect
 		rescue Racc::ParseError => e
 			maruku_error "Could not parse TeX: \n#{tex}"+
 				"\n\n #{e.inspect}"
 		end
 		nil
 	end
 	def to_html_inline_math_ritex
 		tex = self.math
 		mathml = convert_to_mathml_ritex(tex)
 		return mathml || []
 	end
 	def to_html_equation_ritex
 		tex = self.math
 		mathml = convert_to_mathml_ritex(tex)
 		return mathml || []
 	end
 end end end
--- a/lib/maruku/ext/math/parsing.rb
+++ b/lib/maruku/ext/math/parsing.rb
@ -0,0 +1,82 @@
 module MaRuKu
 	class MDDocument
 		# Hash equation id (String) to equation element (MDElement)
 		attr_accessor :eqid2eq
 	end
 end
 	# At least one slash inside
 	#RegInlineMath1 = /\$([^\$]*[\\][^\$]*)\$/
 	# No spaces around the delimiters
 	#RegInlineMath2 = /\$([^\s\$](?:[^\$]*[^\s\$])?)\$/
 	#RegInlineMath = Regexp::union(RegInlineMath1,RegInlineMath2)
 	# Everything goes; takes care of escaping the "\$" inside the expression
 	RegInlineMath = /\${1}((?:[^\$]|\\\$)+)\$/
 	MaRuKu::In::Markdown::
 	register_span_extension(:chars => ?$, :regexp => RegInlineMath) do 
 		|doc, src, con|
 		if m = src.read_regexp(RegInlineMath)
 			math = m.captures.compact.first
 			con.push doc.md_inline_math(math)
 			true
 		else
 			#puts "not math: #{src.cur_chars 10}"
 			false
 		end
 	end
 	EquationStart = /^[ ]{0,3}(?:\\\[|\$\$)(.*)$/
 	EqLabel = /(?:\((\w+)\))/
 	OneLineEquation = /^[ ]{0,3}(?:\\\[|\$\$)(.*)(?:\\\]|\$\$)\s*#{EqLabel}?\s*$/
 	EquationEnd = /^(.*)(?:\\\]|\$\$)\s*#{EqLabel}?\s*$/
 	MaRuKu::In::Markdown::
 	register_block_extension(:regexp  => EquationStart) do |doc, src, con|
 #		puts "Equation :#{self}"
 		first = src.shift_line
 		if first =~ OneLineEquation
 			math = $1
 			label = $2 
 			con.push doc.md_equation($1, $2)
 		else
 			first =~ EquationStart
 			math = $1
 			label = nil
 			while true
 				if not src.cur_line
 					maruku_error "Stream finished while reading equation\n\n"+
 					add_tabs(math,1,'$> '), src, con
 					break
 				end
 				line = src.shift_line
 				if line =~ EquationEnd
 					math += $1 + "\n"
 					label = $2 if $2
 					break
 				else
 					math += line + "\n"
 				end
 			end
 			con.push doc.md_equation(math, label)
 		end
 		true
 	end
 	# This adds support for \eqref
 	RegEqrefLatex = /\\eqref\{(\w+)\}/
 	RegEqPar = /\(eq:(\w+)\)/
 	RegEqref = Regexp::union(RegEqrefLatex, RegEqPar)
 	MaRuKu::In::Markdown::
 	register_span_extension(:chars => [?\\, ?(], :regexp => RegEqref) do 
 		|doc, src, con|
 		eqid = src.read_regexp(RegEqref).captures.compact.first
 		r = doc.md_el(:eqref, [], meta={:eqid=>eqid})
 		con.push r
 	 	true 
 	end
--- a/lib/maruku/ext/math/to_html.rb
+++ b/lib/maruku/ext/math/to_html.rb
@ -0,0 +1,107 @@
 =begin maruku_doc
 Attribute: html_math_engine
 Scope: document, element
 Output: html
 Summary: Select the rendering engine for math.
 Default: <?mrk Globals[:html_math_engine].to_s ?>
 Select the rendering engine for math.
 If you want to use your engine `foo`, then set:
 	HTML math engine: foo
 {:lang=markdown}
 and then implement two functions:
 	def to_html_inline_math_foo
 		# You can: either return a REXML::Element
 		#    return Element.new 'div'    
 		# or return an empty array on error
 		#    return []  
 		# or have a string parsed by REXML:
 		tex = self.math
 		tex.gsub!('&','&amp;')
 		mathml = "<code>#{tex}</code>"
 		return Document.new(mathml).root
 	end
 	def to_html_equation_foo
 		# same thing
 		...
 	end
 {:lang=ruby}
 =end
 module MaRuKu; module Out; module HTML
 	def to_html_inline_math
 		s = get_setting(:html_math_engine)
 		method = "to_html_inline_math_#{s}".to_sym
 		if self.respond_to? method
 			self.send method ||  to_html_equation_none
 		else 
 			puts "A method called #{method} should be defined."
 			return []
 		end
 	end
 	def add_class_to(el, cl)
 		el.attributes['class'] = 
 		if already = el.attributes['class']
 			already + " " + cl
 		else
 			cl
 		end
 	end
 	def to_html_equation
 		s = get_setting(:html_math_engine)
 		method = "to_html_equation_#{s}".to_sym
 		if self.respond_to? method
 			mathml = self.send(method) || to_html_equation_none
 			div = create_html_element 'div'
 			add_class_to(div, 'maruku-equation')
 				if self.label # then numerate
 					span = Element.new 'span'
 					span.attributes['class'] = 'maruku-eq-number'
 					num = self.num
 					span << Text.new("(#{num})")
 					div << span
 					div.attributes['id'] = "eq:#{self.label}"
 				end
 				div << mathml
 				source_div = Element.new 'div'
 					add_class_to(source_div, 'maruku-eq-tex')
 					code = to_html_equation_none	
 					code.attributes['style'] = 'display: none'
 				source_div << code
 				div << source_div
 			div
 		else 
 			puts "A method called #{method} should be defined."
 			return []
 		end
 	end
 	def to_html_eqref
 		if eq = self.doc.eqid2eq[self.eqid]
 			num = eq.num
 			a = Element.new 'a'
 			a.attributes['class'] = 'maruku-eqref'
 			a.attributes['href'] = "#eq:#{self.eqid}"
 			a << Text.new("(#{num})")
 			a
 		else
 			maruku_error "Cannot find equation #{self.eqid.inspect}"
 			Text.new "(#{self.eqid})"
 		end
 	end
 end end end
--- a/lib/maruku/ext/math/to_latex.rb
+++ b/lib/maruku/ext/math/to_latex.rb
@ -0,0 +1,21 @@
 module MaRuKu; module Out; module Latex
 	def to_latex_inline_math
 		"$#{self.math.strip}$"
 	end
 	def to_latex_equation
 		if self.label
 			l =  "\\label{#{self.label}}"
 			"\\begin{equation}\n#{self.math.strip}\n#{l}\\end{equation}\n"
 		else
 			"\\begin{displaymath}\n#{self.math.strip}\n\\end{displaymath}\n"
 		end
 	end
 	def to_latex_eqref
 		"\\eqref{#{self.eqid}}"
 	end
 end end end
--- a/lib/maruku/helpers.rb
+++ b/lib/maruku/helpers.rb
@ -0,0 +1,259 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 # A series of helper functions for creating elements: they hide the 
 # particular internal representation.
 #
 # Please, always use these instead of creating MDElement.
 #
 module MaRuKu
 module Helpers
 	# if the first is a md_ial, it is used as such
 	def md_el(node_type, children=[], meta={}, al=nil)
 		if  (e=children.first).kind_of?(MDElement) and 
 			e.node_type == :ial then
 			if al
 				al += e.ial
 			else
 				al = e.ial
 			end
 			children.shift
 		end 
 		e = MDElement.new(node_type, children, meta, al)
 		e.doc = @doc
 		return e
 	end
 	def md_header(level, children, al=nil)
 		md_el(:header, children, {:level => level}, al)
 	end
 	# Inline code
 	def md_code(code, al=nil)
 		md_el(:inline_code, [], {:raw_code => code}, al)
 	end
 	# Code block
 	def md_codeblock(source, al=nil)
 		md_el(:code, [], {:raw_code => source}, al)
 	end
 	def md_quote(children, al=nil)
 		md_el(:quote, children, {}, al)
 	end
 	def md_li(children, want_my_par, al=nil)
 		md_el(:li, children, {:want_my_paragraph=>want_my_par}, al)
 	end
 	def md_footnote(footnote_id, children, al=nil)
 		md_el(:footnote, children, {:footnote_id=>footnote_id}, al)
 	end
 	def md_abbr_def(abbr, text, al=nil)
 		md_el(:abbr_def, [], {:abbr=>abbr, :text=>text}, al)
 	end
 	def md_abbr(abbr, title)
 		md_el(:abbr, [abbr], {:title=>title})
 	end
 	def md_html(raw_html, al=nil)
 		e = md_el(:raw_html, [], {:raw_html=>raw_html})
 		begin
 			# remove newlines and whitespace at begin
 			# end end of string, or else REXML gets confused
 			raw_html = raw_html.gsub(/\A\s*</,'<').
 			                    gsub(/>[\s\n]*\Z/,'>')
 			raw_html = "<marukuwrap>#{raw_html}</marukuwrap>"
 			e.instance_variable_set :@parsed_html,
 			 	REXML::Document.new(raw_html)
 		rescue 
 #			tell_user "Malformed block of HTML:\n"+
 #			add_tabs(raw_html,1,'|')
 #			"  #{raw_html.inspect}\n\n"+ex.inspect
 		end
 		e
 	end
 	def md_link(children, ref_id, al=nil)
 		md_el(:link, children, {:ref_id=>ref_id.downcase}, al)
 	end
 	def md_im_link(children, url, title=nil, al=nil)
 		md_el(:im_link, children, {:url=>url,:title=>title}, al)
 	end
 	def md_image(children, ref_id, al=nil)
 		md_el(:image, children, {:ref_id=>ref_id}, al)
 	end
 	def md_im_image(children, url, title=nil, al=nil)
 		md_el(:im_image, children, {:url=>url,:title=>title},al)
 	end
 	def md_em(children, al=nil)
 		md_el(:emphasis, [children].flatten, {}, al)
 	end
 	def md_br()
 		md_el(:linebreak, [], {}, nil)
 	end
 	def md_hrule()
 		md_el(:hrule, [], {}, nil)
 	end
 	def md_strong(children, al=nil)
 		md_el(:strong, [children].flatten, {}, al)
 	end
 	def md_emstrong(children, al=nil)
 		md_strong(md_em(children), al)
 	end
 	# <http://www.example.com/>
 	def md_url(url, al=nil)
 		md_el(:immediate_link, [], {:url=>url}, al)
 	end
 	# <andrea@rubyforge.org>
 	# <mailto:andrea@rubyforge.org>
 	def md_email(email, al=nil)
 		md_el(:email_address, [], {:email=>email}, al)
 	end
 	def md_entity(entity_name, al=nil)
 		md_el(:entity, [], {:entity_name=>entity_name}, al)
 	end
 	# Markdown extra
 	def md_foot_ref(ref_id, al=nil)
 		md_el(:footnote_reference, [], {:footnote_id=>ref_id}, al)
 	end
 	def md_par(children, al=nil)
 		md_el(:paragraph, children, meta={}, al)
 	end
 	# [1]: http://url [properties]
 	def md_ref_def(ref_id, url, title=nil, meta={}, al=nil)
 		meta[:url] = url
 		meta[:ref_id] = ref_id
 		meta[:title] = title if title
 		md_el(:ref_definition, [], meta, al)
 	end
 	# inline attribute list
 	def md_ial(al)
 		al = Maruku::AttributeList.new(al) if 
 			not al.kind_of?Maruku::AttributeList
 		md_el(:ial, [], {:ial=>al})
 	end
 	# Attribute list definition
 	def md_ald(id, al)
 		md_el(:ald, [], {:ald_id=>id,:ald=>al})
 	end
 	# Server directive <?target code... ?>
 	def md_xml_instr(target, code)
 		md_el(:xml_instr, [], {:target=>target, :code=>code})
 	end
 end
 end
 module MaRuKu
 class MDElement	
 	# outputs abbreviated form  (this should be eval()uable to get the document)
 	def inspect2 
 		s = 
 		case @node_type
 		when :paragraph
 			"md_par(%s)" % children_inspect
 		when :footnote_reference
 			"md_foot_ref(%s)" % self.footnote_id.inspect
 		when :entity
 			"md_entity(%s)" % self.entity_name.inspect
 		when :email_address
 			"md_email(%s)" % self.email.inspect
 		when :inline_code
 			"md_code(%s)" % self.raw_code.inspect
 		when :raw_html
 			"md_html(%s)" % self.raw_html.inspect
 		when :emphasis 
 			"md_em(%s)" % children_inspect
 		when :strong
 			"md_strong(%s)" % children_inspect
 		when :immediate_link
 			"md_url(%s)" % self.url.inspect
 		when :image
 			"md_image(%s, %s)" % [
 				children_inspect, 
 				self.ref_id.inspect]
 		when :im_image
 			"md_im_image(%s, %s, %s)" % [
 				children_inspect, 
 				self.url.inspect,
 				self.title.inspect]
 		when :link
 				"md_link(%s,%s)" % [
 					children_inspect, self.ref_id.inspect]
 		when :im_link
 				"md_im_link(%s, %s, %s)" % [
 					children_inspect, 
 					self.url.inspect,
 					self.title.inspect,
 				]
 		when :ref_definition
 			"md_ref_def(%s, %s, %s)" % [
 					self.ref_id.inspect, 
 					self.url.inspect,
 					self.title.inspect
 				]
 		when :ial
 			"md_ial(%s)" % self.ial.inspect
 		else
 			return nil
 		end
 		if @al and not @al.empty? then 
 			s = s.chop + ", #{@al.inspect})"
 		end
 		s
 	end
 end
 end
--- a/lib/maruku/input/charsource.rb
+++ b/lib/maruku/input/charsource.rb
@ -0,0 +1,325 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 module MaRuKu; module In; module Markdown; module SpanLevelParser
 # a string scanner coded by me
 class CharSourceManual; end
 # a wrapper around StringScanner
 class CharSourceStrscan; end
 # A debug scanner that checks the correctness of both
 # by comparing their output
 class CharSourceDebug; end
 # Choose!
 CharSource = CharSourceManual     # faster! 58ms vs. 65ms
 #CharSource = CharSourceStrscan
 #CharSource = CharSourceDebug
 class CharSourceManual
 	include MaRuKu::Strings
 	def initialize(s, parent=nil)
 		raise "Passed #{s.class}" if not s.kind_of? String
 		@buffer = s
 		@buffer_index = 0
 		@parent = parent
 	end
 	# Return current char as a FixNum (or nil).
 	def cur_char; @buffer[@buffer_index]   end
 	# Return the next n chars as a String.
 	def cur_chars(n); @buffer[@buffer_index,n]  end
 	# Return the char after current char as a FixNum (or nil).
 	def next_char; @buffer[@buffer_index+1] end
 	def shift_char
 		c = @buffer[@buffer_index]
 		@buffer_index+=1
 		c
 	end
 	def ignore_char
 		@buffer_index+=1
 		nil
 	end
 	def ignore_chars(n)
 		@buffer_index+=n
 		nil
 	end
 	def current_remaining_buffer
 		@buffer[@buffer_index, @buffer.size-@buffer_index]
 	end
 	def cur_chars_are(string)
 		# There is a bug here
 		if false
 			r2 = /^.{#{@buffer_index}}#{Regexp.escape string}/m
 			@buffer =~ r2
 		else
 			cur_chars(string.size) == string
 		end
 	end
 	def next_matches(r)
 		r2 = /^.{#{@buffer_index}}#{r}/m
 		md = r2.match @buffer
 		return !!md
 	end
 	def read_regexp3(r)
 		r2 = /^.{#{@buffer_index}}#{r}/m
 		m = r2.match @buffer
 		if m
 			consumed = m.to_s.size - @buffer_index
 #			puts "Consumed #{consumed} chars (entire is #{m.to_s.inspect})"
 			ignore_chars consumed
 		else
 #			puts "Could not read regexp #{r2.inspect} from buffer "+
 #			" index=#{@buffer_index}"
 #			puts "Cur chars = #{cur_chars(20).inspect}"
 #			puts "Matches? = #{cur_chars(20) =~ r}"
 		end
 		m
 	end
 		def read_regexp(r)
 			r2 = /^#{r}/
 			rest = current_remaining_buffer
 			m = r2.match(rest)
 			if m
 				@buffer_index += m.to_s.size
 #				puts "#{r} matched #{rest.inspect}: #{m.to_s.inspect}"
 			end
 			return m
 		end
 	def consume_whitespace
 		while c = cur_char 
 			if (c == 32 || c == ?\t)
 #				puts "ignoring #{c}"
 				ignore_char
 			else
 #				puts "#{c} is not ws: "<<c
 				break
 			end
 		end
 	end
 	def read_text_chars(out)
 		s = @buffer.size; c=nil
 		while @buffer_index < s && (c=@buffer[@buffer_index]) &&
 			 ((c>=?a && c<=?z) || (c>=?A && c<=?Z))
 				out << c
 				@buffer_index += 1
 		end
 	end
 	def describe
 		s = describe_pos(@buffer, @buffer_index)
 		if @parent
 			s += "\n\n" + @parent.describe
 		end
 		s
 	end
 	include SpanLevelParser
 end
 def describe_pos(buffer, buffer_index)
 	len = 75
 	num_before = [len/2, buffer_index].min
 	num_after = [len/2, buffer.size-buffer_index].min
 	num_before_max = buffer_index
 	num_after_max = buffer.size-buffer_index
 #		puts "num #{num_before} #{num_after}"
 	num_before = [num_before_max, len-num_after].min
 	num_after  = [num_after_max, len-num_before].min
 #		puts "num #{num_before} #{num_after}"
 	index_start = [buffer_index - num_before, 0].max
 	index_end   = [buffer_index + num_after, buffer.size].min
 	size = index_end- index_start
 #		puts "- #{index_start} #{size}"
 	str = buffer[index_start, size]
 	str.gsub!("\n",'N')
 	str.gsub!("\t",'T')
 	if index_end == buffer.size 
 		str += "EOF"
 	end
 	pre_s = buffer_index-index_start
 	pre_s = [pre_s, 0].max
 	pre_s2 = [len-pre_s,0].max
 #		puts "pre_S = #{pre_s}"
 	pre =" "*(pre_s) 
 	"-"*len+"\n"+
 	str + "\n" +
 	"-"*pre_s + "|" + "-"*(pre_s2)+"\n"+
 #		pre + "|\n"+
 	pre + "+--- Byte #{buffer_index}\n"+
 	"Shown bytes [#{index_start} to #{size}] of #{buffer.size}:\n"+
 	add_tabs(buffer,1,">")
 #		"CharSource: At character #{@buffer_index} of block "+
 #		" beginning with:\n    #{@buffer[0,50].inspect} ...\n"+
 #		" before: \n     ... #{cur_chars(50).inspect} ... "
 end
 require 'strscan'
 class CharSourceStrscan
 	include SpanLevelParser
 	include MaRuKu::Strings
 	def initialize(s)
 		@s = StringScanner.new(s)
 	end
 	# Return current char as a FixNum (or nil).
 	def cur_char
 		 @s.peek(1)[0]
 	end
 	# Return the next n chars as a String.
 	def cur_chars(n); 
 		@s.peek(n)
 	end
 	# Return the char after current char as a FixNum (or nil).
 	def next_char; 
 		@s.peek(2)[1]
 	end
 	def shift_char
 		(@s.get_byte)[0]
 	end
 	def ignore_char
 		@s.get_byte
 		nil
 	end
 	def ignore_chars(n)
 		n.times do @s.get_byte end
 		nil
 	end
 	def current_remaining_buffer
 		@s.rest #nil #@buffer[@buffer_index, @buffer.size-@buffer_index]
 	end
 	def cur_chars_are(string)
 		cur_chars(string.size) == string
 	end
 	def next_matches(r)
 		len = @s.match?(r)
 		return !!len
 	end
 	def read_regexp(r)
 		string = @s.scan(r)
 		if string
 			return r.match(string)
 		else
 			return nil
 		end
 	end
 	def consume_whitespace
 		@s.scan /\s+/
 		nil
 	end
 	def describe
 		describe_pos(@s.string, @s.pos)
 	end
 end
 class CharSourceDebug
 	def initialize(s)
 		@a = CharSourceManual.new(s)
 		@b = CharSourceStrscan.new(s)
 	end
 	def method_missing(methodname, *args)
 		a_bef = @a.describe
 		b_bef = @b.describe
 		a = @a.send(methodname, *args)
 		b = @b.send(methodname, *args)
 #		if methodname == :describe
 #			return a
 #		end
 		if a.kind_of? MatchData
 			if a.to_a != b.to_a
 				puts "called: #{methodname}(#{args})"
 				puts "Matchdata:\na = #{a.to_a.inspect}\nb = #{b.to_a.inspect}"
 				puts "AFTER: "+@a.describe
 				puts "AFTER: "+@b.describe
 				puts "BEFORE: "+a_bef
 				puts "BEFORE: "+b_bef
 				puts caller.join("\n")
 				exit
 			end
 		else
 			if a!=b
 				puts "called: #{methodname}(#{args})"
 				puts "Attenzione!\na = #{a.inspect}\nb = #{b.inspect}"
 				puts ""+@a.describe
 				puts ""+@b.describe
 				puts caller.join("\n")
 				exit
 			end
 		end
 		if @a.cur_char != @b.cur_char
 			puts "Fuori sincronia dopo #{methodname}(#{args})"
 			puts ""+@a.describe
 			puts ""+@b.describe
 			exit
 		end
 		return a
 	end
 end
 end end end end
--- a/lib/maruku/input/extensions.rb
+++ b/lib/maruku/input/extensions.rb
@ -0,0 +1,68 @@
 module MaRuKu; module In; module Markdown
 	# Hash Fixnum -> name
 	SpanExtensionsTrigger = {}
 	class SpanExtension
 		# trigging chars
 		attr_accessor :chars
 		# trigging regexp
 		attr_accessor :regexp
 		# lambda
 		attr_accessor :block
 	end
 	# Hash String -> Extension
 	SpanExtensions = {}
 	def check_span_extensions(src, con)
 		c = src.cur_char
 		if extensions = SpanExtensionsTrigger[c]
 			extensions.each do |e|
 				if e.regexp && (match = src.next_matches(e.regexp))
 					return true if e.block.call(doc, src, con)
 				end
 			end
 		end
 		return false # not special
 	end
 	def self.register_span_extension(args, &block)
 		e = SpanExtension.new
 		e.chars = [*args[:chars]]
 		e.regexp = args[:regexp]
 		e.block = block
 		e.chars.each do |c|
 			(SpanExtensionsTrigger[c] ||= []).push e
 		end
 	end
 	def self.register_block_extension(args, &block)
 		regexp = args[:regexp]
 		BlockExtensions[regexp] = block
 	end
 	# Hash Regexp -> Block
 	BlockExtensions = {}
 	def check_block_extensions(src, con, line)
 		BlockExtensions.each do |reg, block|
 			if m = reg.match(line)
 				block = BlockExtensions[reg]
 				return true if block.call(doc, src, con)
 			end
 		end
 		return false # not special
 	end
 	def any_matching_block_extension?(line)
 		BlockExtensions.each_key do |reg|
 			m = reg.match(line)
 			return m if m
 		end
 		return false
 	end
 end end end
--- a/lib/maruku/input/html_helper.rb
+++ b/lib/maruku/input/html_helper.rb
@ -0,0 +1,144 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 module MaRuKu; module In; module Markdown; module SpanLevelParser
 # This class helps me read and sanitize HTML blocks
 # I tried to do this with REXML, but wasn't able to. (suggestions?)
 	class HTMLHelper
 		include MaRuKu::Strings
 		Tag = %r{^<(/)?(\w+)\s*([^>]*)>}m
 		EverythingElse = %r{^[^<]+}m
 		CommentStart = %r{^<!--}x
 		CommentEnd = %r{^.*-->}
 		TO_SANITIZE = ['img','hr'] 
 #		attr_accessor :inside_comment
 		attr_reader :rest
 		def initialize 
 			@rest = ""
 			@tag_stack = []
 			@m = nil
 			@already = ""
 			@inside_comment = false
 		end
 		def eat_this(line)
 			@rest = line  + @rest
 			things_read = 0
 			until @rest.empty?
 				if @inside_comment
 					if @m = CommentEnd.match(@rest)
 						@inside_comment = false
 						@already += @m.pre_match + @m.to_s
 						@rest = @m.post_match
 					elsif @m = EverythingElse.match(@rest)
 						@already += @m.pre_match + @m.to_s
 						@rest = @m.post_match
 					end
 				else
 					if @m = CommentStart.match(@rest)
 						things_read += 1
 						@inside_comment = true
 						@already += @m.pre_match + @m.to_s
 						@rest = @m.post_match
 					elsif @m = Tag.match(@rest)
 						things_read += 1
 						@already += @m.pre_match
 						@rest = @m.post_match
 						is_closing = !!@m[1]
 						tag = @m[2]
 						attributes = @m[3]
 						is_single = false
 						if attributes =~ /\A(.*)\/\Z/
 							attributes = $1
 							is_single = true
 						end
 						if TO_SANITIZE.include? tag 
 							attributes.strip!
 					#		puts "Attributes: #{attributes.inspect}"
 							if attributes.size > 0
 								@already +=  '<%s %s />' % [tag, attributes]
 							else
 								@already +=  '<%s />' % [tag]
 							end
 						elsif is_closing
 							@already += @m.to_s
 							if @tag_stack.empty?
 								error "Malformed: closing tag #{tag.inspect} "+
 								      "in empty list"
 							end 
 							if @tag_stack.last != tag
 								error "Malformed: tag <#{tag}> "+
 								      "closes <#{@tag_stack.last}>"
 							end
 							@tag_stack.pop
 						elsif not is_single
 							@tag_stack.push tag
 							@already += @m.to_s
 						end
 					elsif @m = EverythingElse.match(@rest)
 						@already += @m.pre_match + @m.to_s
 						@rest = @m.post_match
 					else
 						error "Malformed HTML: not complete: #{@rest.inspect}"
 					end
 				end # not inside comment
 #				puts inspect
 #				puts "Read: #{@tag_stack.inspect}"
 				break if is_finished? and things_read>0	
 			end
 		end
 		def error(s)
 			raise Exception, "Error: #{s} \n"+ inspect, caller
 		end
 		def inspect; "HTML READER\n comment=#{@inside_comment} "+
 			"match=#{@m.to_s.inspect}\n"+
 			"Tag stack = #{@tag_stack.inspect} \n"+
 			"Before:\n"+
 			add_tabs(@already,1,'|')+"\n"+
 			"After:\n"+
 			add_tabs(@rest,1,'|')+"\n"
 		end
 		def stuff_you_read
 			@already
 		end
 		def is_finished?
 			not @inside_comment and @tag_stack.empty?
 		end
 	end # html helper 
 end end end end
--- a/lib/maruku/input/linesource.rb
+++ b/lib/maruku/input/linesource.rb
@ -0,0 +1,111 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 module MaRuKu; module In; module Markdown; module BlockLevelParser
 # This represents a source of lines that can be consumed.
 #
 # It is the twin of CharSource.
 #
 class LineSource
 	include MaRuKu::Strings
 	def initialize(lines, parent=nil, parent_offset=nil)
 		raise "NIL lines? " if not lines
 		@lines = lines
 		@lines_index = 0
 		@parent = parent
 		@parent_offset = parent_offset
 	end
 	def cur_line()  @lines[@lines_index] end
 	def next_line() @lines[@lines_index+1] end
 	def shift_line() 
 		raise "Over the rainbow" if @lines_index >= @lines.size 
 		l = @lines[@lines_index]
 		@lines_index += 1
 		return l
 	end
 	def ignore_line
 		raise "Over the rainbow" if @lines_index >= @lines.size 
 		@lines_index += 1
 	end
 	def describe
 		#s = "At line ##{@lines_index} of #{@lines.size}:\n"
 		s = "At line #{original_line_number(@lines_index)}\n"
 		context = 3 # lines
 		from = [@lines_index-context, 0].max
 		to   = [@lines_index+context, @lines.size-1].min
 		for i in from..to
 			prefix = (i == @lines_index) ? '--> ' : '    ';
 			l = @lines[i]
 			s += "%10s %4s|#{l}" %
 				[@lines[i].md_type.to_s, prefix]
 			s += "|\n"
 		end
 #		if @parent 
 #			s << "Parent context is: \n"
 #			s << add_tabs(@parent.describe,1,'|')
 #		end
 		s
 	end
 	def original_line_number(index)
 		if @parent
 			return index + @parent.original_line_number(@parent_offset)
 		else
 			1 + index
 		end
 	end
 	def cur_index
 		@lines_index
 	end
 	# Returns the type of next line as a string
 	# breaks at first :definition
 	def tell_me_the_future
 		s = ""; num_e = 0;
 		for i in @lines_index..@lines.size-1
 			c = case @lines[i].md_type
 				when :text; "t"
 				when :empty; num_e+=1; "e"
 				when :definition; "d"
 				else "o"
 			end
 			s += c
 			break if c == "d" or num_e>1
 		end
 		s	
 	end
 end # linesource
 end end end end # block
--- a/lib/maruku/input/parse_block.rb
+++ b/lib/maruku/input/parse_block.rb
@ -0,0 +1,594 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 module MaRuKu; module In; module Markdown; module BlockLevelParser
 	include Helpers
 	include MaRuKu::Strings
 	include MaRuKu::In::Markdown::SpanLevelParser
 	class BlockContext < Array
 		def describe
 			n = 5
 			desc = size > n ? self[-n,n] : self
 			"Last #{n} elements: "+
 			desc.map{|x| "\n -" + x.inspect}.join
 		end
 	end
 	# Splits the string and calls parse_lines_as_markdown
 	def parse_text_as_markdown(text)
 		lines =  split_lines(text)
 		src = LineSource.new(lines)
 		return parse_blocks(src)
 	end
 	# Input is a LineSource
 	def parse_blocks(src)
 		output = BlockContext.new
 		# run state machine
 		while src.cur_line
 			next if check_block_extensions(src, output, src.cur_line)
 #  Prints detected type (useful for debugging)
 #			puts "#{src.cur_line.md_type}|#{src.cur_line}"
 			case src.cur_line.md_type
 				when :empty; 
 					output.push :empty
 					src.ignore_line
 				when :ial
 					m =  InlineAttributeList.match src.shift_line
 					content = m[1] ||  "" 
 					src2 = CharSource.new(content, src)
 					interpret_extension(src2, output, [nil])
 				when :ald
 					output.push read_ald(src)
 				when :text
 					if src.cur_line =~ MightBeTableHeader and 
 						(src.next_line && src.next_line =~ TableSeparator)
 						output.push read_table(src)
 					elsif [:header1,:header2].include? src.next_line.md_type
 						output.push read_header12(src)
 					elsif eventually_comes_a_def_list(src)
 					 	definition = read_definition(src)
 						if output.last.kind_of?(MDElement) && 
 							output.last.node_type == :definition_list then
 							output.last.children << definition
 						else
 							output.push md_el(:definition_list, [definition])
 						end
 					else # Start of a paragraph
 						output.push read_paragraph(src)
 					end
 				when :header2, :hrule
 					# hrule
 					src.shift_line
 					output.push md_hrule()
 				when :header3
 					output.push read_header3(src)
 				when :ulist, :olist
 					list_type = src.cur_line.md_type == :ulist ? :ul : :ol
 					li = read_list_item(src)
 					# append to current list if we have one
 					if output.last.kind_of?(MDElement) && 
 						output.last.node_type == list_type then
 						output.last.children << li
 					else
 						output.push md_el(list_type, [li])
 					end
 				when :quote;    output.push read_quote(src)
 				when :code;     e = read_code(src); output << e if e
 				when :raw_html; e = read_raw_html(src); output << e if e
 				when :footnote_text;   output.push read_footnote_text(src)
 				when :ref_definition;  output.push read_ref_definition(src)
 				when :abbreviation;    output.push read_abbreviation(src)
 				when :xml_instr;       read_xml_instruction(src, output)
 				when :metadata;        
 					maruku_error "Please use the new meta-data syntax: \n"+
 					"  http://maruku.rubyforge.org/proposal.html\n", src
 					src.ignore_line
 				else # warn if we forgot something
 					md_type = src.cur_line.md_type
 					line = src.cur_line
 					maruku_error "Ignoring line '#{line}' type = #{md_type}", src
 					src.shift_line
 			end
 		end
 		merge_ial(output, src, output)
 		output.delete_if {|x| x.kind_of?(MDElement) &&
 			x.node_type == :ial}
 		# get rid of empty line markers
 		output.delete_if {|x| x == :empty}
 		# See for each list if we can omit the paragraphs and use li_span
 		# TODO: do this after
 		output.each do |c| 
 			# Remove paragraphs that we can get rid of
 			if [:ul,:ol].include? c.node_type 
 				if c.children.all? {|li| !li.want_my_paragraph} then
 					c.children.each do |d|
 						d.node_type = :li_span
 						d.children = d.children[0].children 
 					end
 				end
 			end 
 			if c.node_type == :definition_list
 				if c.children.all?{|defi| !defi.want_my_paragraph} then
 					c.children.each do |definition| 
 						definition.definitions.each do |dd|
 							dd.children = dd.children[0].children 
 						end
 					end
 				end
 			end 
 		end
 		output
 	end
 	def read_ald(src)
 		if (l=src.shift_line) =~ AttributeDefinitionList
 			id = $1;   al=$2;
 			al = read_attribute_list(CharSource.new(al,src), context=nil, break_on=[nil])
 			self.ald[id] = al;
 			return md_ald(id, al)
 		else
 			maruku_error "Bug Bug:\n#{l.inspect}"
 			return nil
 		end
 	end
 	# reads a header (with ----- or ========)
 	def read_header12(src)
 		line = src.shift_line.strip
 		al = nil
 		# Check if there is an IAL
 		if new_meta_data? and line =~ /^(.*)\{(.*)\}\s*$/
 			line = $1.strip
 			ial = $2
 			al  = read_attribute_list(CharSource.new(ial,src), context=nil, break_on=[nil])
 		end
 		text = parse_lines_as_span [ line ]
 		level = src.cur_line.md_type == :header2 ? 2 : 1;  
 		src.shift_line
 		return md_header(level, text, al)
 	end
 	# reads a header like '#### header ####'	
 	def read_header3(src)
 		line = src.shift_line.strip
 		al = nil
 		# Check if there is an IAL
 		if new_meta_data? and line =~ /^(.*)\{(.*)\}\s*$/
 			line = $1.strip
 			ial = $2
 			al  = read_attribute_list(CharSource.new(ial,src), context=nil, break_on=[nil])
 		end
 		level = num_leading_hashes(line)
 		text = parse_lines_as_span [strip_hashes(line)] 
 		return md_header(level, text, al)
 	end
 	def read_xml_instruction(src, output)
 		m = /^\s*<\?((\w+)\s*)?(.*)$/.match src.shift_line
 		raise "BugBug" if not m
 		target = m[2] || ''
 		code = m[3]
 		until code =~ /\?>/
 			code += "\n"+src.shift_line
 		end
 		if not code =~ (/\?>\s*$/)
 			garbage = (/\?>(.*)$/.match(code))[1]
 			maruku_error "Trailing garbage on last line: #{garbage.inspect}:\n"+
 				add_tabs(code, 1, '|'), src
 		end
 		code.gsub!(/\?>\s*$/, '')
 		if target == 'mrk' && MaRuKu::Globals[:unsafe_features]
 			result = safe_execute_code(self, code)	
 			if result
 				if result.kind_of? String
 					raise "Not expected"
 				else
 					output.push *result
 				end
 			end
 		else
 			output.push md_xml_instr(target, code)
 		end
 	end
 	def read_raw_html(src)
 		h = HTMLHelper.new
 		begin 
 			h.eat_this(l=src.shift_line)
 #			puts "\nBLOCK:\nhtml -> #{l.inspect}"
 			while src.cur_line and not h.is_finished? 
 				l=src.shift_line
 #				puts "html -> #{l.inspect}"
 				h.eat_this "\n"+l
 			end
 		rescue Exception => e
 			ex = e.inspect + e.backtrace.join("\n")
 			maruku_error "Bad block-level HTML:\n#{add_tabs(ex,1,'|')}\n", src
 		end
 		raw_html = h.stuff_you_read
 		return md_html(raw_html)
 	end
 	def read_paragraph(src)
 		lines = []
 		while src.cur_line 
 			# :olist does not break
 			case t = src.cur_line.md_type
 				when :quote,:header3,:empty,:raw_html,:ref_definition,:ial,:xml_instr
 					break
 				when :olist,:ulist
 					break if src.next_line.md_type == t
 			end
 			break if src.cur_line.strip.size == 0			
 			break if [:header1,:header2].include? src.next_line.md_type
 			break if any_matching_block_extension?(src.cur_line)
 			lines << src.shift_line
 		end
 #		dbg_describe_ary(lines, 'PAR')
 		children = parse_lines_as_span(lines, src)
 		return md_par(children)
 	end
 	# Reads one list item, either ordered or unordered.
 	def read_list_item(src)
 		parent_offset = src.cur_index
 		item_type = src.cur_line.md_type
 		first = src.shift_line
 		# Ugly things going on inside `read_indented_content`
 		indentation = spaces_before_first_char(first)
 		break_list = [:ulist, :olist, :ial]
 		lines, want_my_paragraph = 
 			read_indented_content(src,indentation, break_list, item_type)
 		# add first line
 			# Strip first '*', '-', '+' from first line
 			stripped = first[indentation, first.size-1]
 		lines.unshift stripped
 		#dbg_describe_ary(lines, 'LIST ITEM ')
 		src2 = LineSource.new(lines, src, parent_offset)
 		children = parse_blocks(src2)
 		with_par = want_my_paragraph || (children.size>1)
 		return md_li(children, with_par)
 	end
 	def read_abbreviation(src)
 		if not (l=src.shift_line) =~ Abbreviation
 			maruku_error "Bug: it's Andrea's fault. Tell him.\n#{l.inspect}"
 		end
 		abbr = $1
 		desc = $2
 		if (not abbr) or (abbr.size==0)
 			maruku_error "Bad abbrev. abbr=#{abbr.inspect} desc=#{desc.inspect}"
 		end
 		self.abbreviations[abbr] = desc
 		return md_abbr_def(abbr, desc)
 	end
 	def read_footnote_text(src)
 		parent_offset = src.cur_index
 		first = src.shift_line
 		if not first =~ FootnoteText 
 			maruku_error "Bug (it's Andrea's fault)"
 		end
 		id = $1
 		text = $2
 		# Ugly things going on inside `read_indented_content`
 		indentation = 4 #first.size-text.size
 #		puts "id =_#{id}_; text=_#{text}_ indent=#{indentation}"
 		break_list = [:footnote_text]
 		item_type = :footnote_text
 		lines, want_my_paragraph = 
 			read_indented_content(src,indentation, break_list, item_type)
 		# add first line
 		if text && text.strip != "" then lines.unshift text end
 #		dbg_describe_ary(lines, 'FOOTNOTE')
 		src2 = LineSource.new(lines, src, parent_offset)
 		children = parse_blocks(src2)
 		e = md_footnote(id, children)
 		self.footnotes[id] = e
 		return e
 	end
 	# This is the only ugly function in the code base.
 	# It is used to read list items, descriptions, footnote text
 	def read_indented_content(src, indentation, break_list, item_type)
 		lines =[]
 		# collect all indented lines
 		saw_empty = false; saw_anything_after = false
 		while src.cur_line 
 			#puts "#{src.cur_line.md_type} #{src.cur_line.inspect}"
 			if src.cur_line.md_type == :empty
 				saw_empty = true
 				lines << src.shift_line
 				next
 			end
 			# after a white line
 			if saw_empty
 				# we expect things to be properly aligned
 				if (ns=number_of_leading_spaces(src.cur_line)) < indentation
 					#puts "breaking for spaces, only #{ns}: #{src.cur_line}"
 					break
 				end
 				saw_anything_after = true
 			else
 				break if break_list.include? src.cur_line.md_type
 #				break if src.cur_line.md_type != :text
 			end
 			stripped = strip_indent(src.shift_line, indentation)
 			lines << stripped
 			#puts "Accepted as #{stripped.inspect}"
 			# You are only required to indent the first line of 
 			# a child paragraph.
 			if stripped.md_type == :text
 				while src.cur_line && (src.cur_line.md_type == :text)
 					lines << strip_indent(src.shift_line, indentation)
 				end
 			end
 		end
 		want_my_paragraph = saw_anything_after || 
 			(saw_empty && (src.cur_line  && (src.cur_line.md_type == item_type))) 
 #		dbg_describe_ary(lines, 'LI')
 		# create a new context 
 		while lines.last && (lines.last.md_type == :empty)
 			lines.pop
 		end
 		return lines, want_my_paragraph
 	end
 	def read_quote(src)
 		parent_offset = src.cur_index
 		lines = []
 		# collect all indented lines
 		while src.cur_line && src.cur_line.md_type == :quote
 			lines << unquote(src.shift_line)
 		end
 #		dbg_describe_ary(lines, 'QUOTE')
 		src2 = LineSource.new(lines, src, parent_offset)
 		children = parse_blocks(src2)
 		return md_quote(children)
 	end
 	def read_code(src)
 		# collect all indented lines
 		lines = []
 		while src.cur_line && ([:code, :empty].include? src.cur_line.md_type)
 			lines << strip_indent(src.shift_line, 4)
 		end
 		#while lines.last && (lines.last.md_type == :empty )
 		while lines.last && lines.last.strip.size == 0
 			lines.pop 
 		end
 		while lines.first && lines.first.strip.size == 0
 			lines.shift 
 		end
 		return nil if lines.empty?
 		source = lines.join("\n")
 #		dbg_describe_ary(lines, 'CODE')
 		return md_codeblock(source)
 	end
 	# Reads a series of metadata lines with empty lines in between
 	def read_metadata(src)
 		hash = {}
 		while src.cur_line 
 			case src.cur_line.md_type
 				when :empty;  src.shift_line
 				when :metadata; hash.merge! parse_metadata(src.shift_line)
 				else break
 			end
 		end
 		hash
 	end
 	def read_ref_definition(src)
 		line = src.shift_line
 		# if link is incomplete, shift next line
 		if src.cur_line && (src.cur_line.md_type != :ref_definition) && 
 			([1,2,3].include? number_of_leading_spaces(src.cur_line) )
 			line += " "+ src.shift_line
 		end
 #		puts "total= #{line}"
 		match = LinkRegex.match(line)
 		if not match
 			error "Link does not respect format: '#{line}'"
 		end
 		id = match[1]; url = match[2]; title = match[3]; 
 		id = id.strip.downcase
 		hash = self.refs[id] = {:url=>url,:title=>title}
 		stuff=match[4]
 		if stuff
 			stuff.split.each do |couple|
 #					puts "found #{couple}"
 				k, v = couple.split('=')
 				v ||= ""
 				if v[0,1]=='"' then v = v[1, v.size-2] end
 #					puts "key:_#{k}_ value=_#{v}_"
 				hash[k.to_sym] = v
 			end
 		end
 #			puts hash.inspect
 		return md_ref_def(id, url, meta={:title=>title})
 	end
 	def read_table(src)
 		def split_cells(s)
 			s.strip.split('|').select{|x|x.strip.size>0}.map{|x|x.strip}
 		end
 		head = split_cells(src.shift_line).map{|s| md_el(:head_cell, parse_lines_as_span([s])) }
 		separator=split_cells(src.shift_line)
 		align = separator.map { |s|  s =~ Sep
 			if $1 and $2 then :center elsif $2 then :right else :left end }
 		num_columns = align.size
 		if head.size != num_columns
 			maruku_error "Table head does not have #{num_columns} columns: \n#{head.inspect}"
 			tell_user "I will ignore this table."
 			# XXX try to recover
 			return md_br()
 		end
 		rows = []
 		while src.cur_line && src.cur_line =~ /\|/
 			row = split_cells(src.shift_line).map{|s|
 				md_el(:cell, parse_lines_as_span([s]))}
 			if head.size != num_columns
 				maruku_error  "Row does not have #{num_columns} columns: \n#{row.inspect}"
 				tell_user "I will ignore this table."
 				# XXX try to recover
 				return md_br()
 			end
 			rows << row
 		end
 		children = (head+rows).flatten
 		return md_el(:table, children, {:align => align})
 	end
 	# If current line is text, a definition list is coming
 	# if 1) text,empty,[text,empty]*,definition
 	def eventually_comes_a_def_list(src)
 		future = src.tell_me_the_future
 		ok = future =~ %r{^t+e?d}x
 #		puts "future: #{future} - #{ok}"
 		ok
 	end
 	def read_definition(src)
 		# Read one or more terms
 		terms = []
 		while  src.cur_line &&  src.cur_line.md_type == :text
 			terms << md_el(:definition_term, parse_lines_as_span([src.shift_line]))
 		end
 #		dbg_describe_ary(terms, 'DT')
 		want_my_paragraph = false
 		raise "Chunky Bacon!" if not src.cur_line
 		# one optional empty
 		if src.cur_line.md_type == :empty
 			want_my_paragraph = true
 			src.shift_line
 		end
 		raise "Chunky Bacon!" if src.cur_line.md_type != :definition
 		# Read one or more definitions
 		definitions = []
 		while src.cur_line && src.cur_line.md_type == :definition
 			parent_offset = src.cur_index
 			first = src.shift_line
 			first =~ Definition
 			first = $1
 			# I know, it's ugly!!!
 			lines, w_m_p = 
 				read_indented_content(src,4, [:definition], :definition)
 			want_my_paragraph ||= w_m_p
 			lines.unshift first
 #			dbg_describe_ary(lines, 'DD')
 			src2 = LineSource.new(lines, src, parent_offset)
 			children = parse_blocks(src2)
 			definitions << md_el(:definition_data, children)
 		end
 		return md_el(:definition, terms+definitions, { 	
 			:terms => terms, 
 			:definitions => definitions, 
 			:want_my_paragraph => want_my_paragraph})
 	end
 end # BlockLevelParser
 end # MaRuKu
 end
 end
--- a/lib/maruku/input/parse_doc.rb
+++ b/lib/maruku/input/parse_doc.rb
@ -0,0 +1,225 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 require 'iconv'
 module MaRuKu; module In; module Markdown; module BlockLevelParser
 	def parse_doc(s)
 		meta2 =  parse_email_headers(s)
 		data = meta2[:data]
 		meta2.delete :data
 		self.attributes.merge! meta2
 =begin maruku_doc
 Attribute: encoding
 Scope:     document
 Summary:   Encoding for the document.
 If the `encoding` attribute is specified, then the content
 will be converted from the specified encoding to UTF-8.
 Conversion happens using the `iconv` library.
 =end
 		enc = self.attributes[:encoding]
 		self.attributes.delete :encoding
 		if enc && enc.downcase != 'utf-8'
 			converted = Iconv.new('utf-8', enc).iconv(data)
 #			puts "Data: #{data.inspect}: #{data}"
 #			puts "Conv: #{converted.inspect}: #{converted}"
 			data = converted
 		end
 		@children = parse_text_as_markdown(data)
 		if true #markdown_extra? 
 			self.search_abbreviations
 			self.substitute_markdown_inside_raw_html
 		end
 		toc = create_toc
 		# use title if not set
 		if not self.attributes[:title] and toc.header_element
 			title = toc.header_element.to_s
 			self.attributes[:title]  = title
 #			puts "Set document title to #{title}"
 		end
 		# save for later use
 		self.toc = toc
 		# Now do the attributes magic
 		each_element do |e|
 			# default attribute list
 			if default = self.ald[e.node_type.to_s]
 				expand_attribute_list(default, e.attributes)
 			end
 			expand_attribute_list(e.al, e.attributes)
 #			puts "#{e.node_type}: #{e.attributes.inspect}"
 		end
 =begin maruku_doc
 Attribute: unsafe_features
 Scope:     global
 Summary:   Enables execution of XML instructions.
 Disabled by default because of security concerns.
 =end
 		if Maruku::Globals[:unsafe_features]
 			self.execute_code_blocks
 			# TODO: remove executed code blocks
 		end
 	end
 	# Expands an attribute list in an Hash
 	def expand_attribute_list(al, result)
 		al.each do |k, v|
 			case k
 			when :class
 				if not result[:class]
 					result[:class] = v
 				else
 					result[:class] += " " + v
 				end
 			when :id; result[:id] = v
 			when :ref; 
 				if self.ald[v]
 					already = (result[:expanded_references] ||= [])
 					if not already.include?(v)
 						already.push v
 						expand_attribute_list(self.ald[v], result)
 					else
 						already.push  v
 						maruku_error "Circular reference between labels.\n\n"+
 						"Label #{v.inspect} calls itself via recursion.\nThe recursion is "+
 							(already.map{|x| x.inspect}.join(' => ')) 
 					end
 				else
 					if not result[:unresolved_references]
 						result[:unresolved_references] = v
 					else
 						result[:unresolved_references] << " #{v}"
 					end
 					result[v.to_sym] = true
 				end
 			else
 				result[k.to_sym]=v
 			end
 		end
 	end
 	def safe_execute_code(object, code)
 		begin
 			return object.instance_eval(code)
 		rescue Exception => e
 			maruku_error "Exception while executing this:\n"+
 				add_tabs(code, 1, ">")+
 				"\nThe error was:\n"+
 				add_tabs(e.inspect+"\n"+e.caller.join("\n"), 1, "|")
 		rescue RuntimeError => e
 			maruku_error "2: Exception while executing this:\n"+
 				add_tabs(code, 1, ">")+
 				"\nThe error was:\n"+
 				add_tabs(e.inspect, 1, "|")
 		rescue SyntaxError => e
 			maruku_error "2: Exception while executing this:\n"+
 				add_tabs(code, 1, ">")+
 				"\nThe error was:\n"+
 				add_tabs(e.inspect, 1, "|")
 		end
 		nil
 	end
 	def execute_code_blocks
 		self.each_element(:xml_instr) do |e|
 			if e.target == 'maruku'
 				result = safe_execute_code(e, e.code)
 				if result.kind_of?(String)
 					puts "Result is : #{result.inspect}"
 				end
 			end
 		end
 	end
 	def search_abbreviations
 		self.abbreviations.each do |abbrev, title|
 			reg = Regexp.new(Regexp.escape(abbrev))
 			self.replace_each_string do |s|
 				if m = reg.match(s)
 					e = md_abbr(abbrev.dup, title ? title.dup : nil)
 					[m.pre_match, e, m.post_match]
 				else
 					s
 				end
 			end
 		end
 	end
 	include REXML
 	# (PHP Markdown extra) Search for elements that have
 	# markdown=1 or markdown=block defined
 	def substitute_markdown_inside_raw_html
 		self.each_element(:raw_html) do |e|
 			doc = e.instance_variable_get :@parsed_html
 			if doc # valid html
 				# parse block-level markdown elements in these HTML tags
 				block_tags = ['div']
 				# use xpath to find elements with 'markdown' attribute
 				XPath.match(doc, "//*[attribute::markdown]" ).each do |e|
 #					puts "Found #{e}"
 					# should we parse block-level or span-level?
 					parse_blocks = (e.attributes['markdown'] == 'block') || 
 					               block_tags.include?(e.name)
 					# remove 'markdown' attribute
 					e.delete_attribute 'markdown'
 					# Select all text elements of e
 					XPath.match(e, "//text()" ).each { |original_text| 
 						s = original_text.value.strip
 						if s.size > 0
 							el = md_el(:dummy,
 							 	parse_blocks ? parse_text_as_markdown(s) :
 							                  parse_lines_as_span([s]) )
 							p = original_text.parent
 							el.children_to_html.each do |x|
 								p.insert_before(original_text, x)
 							end
 							p.delete(original_text)
 						end
 					}
 				end
 			end
 		end
 	end
 end end end end
--- a/lib/maruku/input/parse_span_better.rb
+++ b/lib/maruku/input/parse_span_better.rb
@ -0,0 +1,692 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 require 'set'
 module MaRuKu; module In; module Markdown; module SpanLevelParser
 	include MaRuKu::Helpers
 	EscapedCharInText = 
 		Set.new [?\\,?`,?*,?_,?{,?},?[,?],?(,?),?#,?.,?!,?|,?:,?+,?-,?>]
 	EscapedCharInQuotes = 
 		Set.new [?\\,?`,?*,?_,?{,?},?[,?],?(,?),?#,?.,?!,?|,?:,?+,?-,?>,?',?"]
 	EscapedCharInInlineCode = [?\\,?`]
 	def parse_lines_as_span(lines, parent=nil)
 		parse_span_better lines.join("\n"), parent
 	end
 	def parse_span_better(string, parent=nil)
 		if not string.kind_of? String then 
 			error "Passed #{string.class}." end
 		st = (string + "")
 		st.freeze
 		src = CharSource.new(st, parent)
 		read_span(src, EscapedCharInText, [nil])
 	end
 	# This is the main loop for reading span elements
 	#
 	# It's long, but not *complex* or difficult to understand.
 	#
 	#
 	def read_span(src, escaped, exit_on_chars, exit_on_strings=nil)
 		con = SpanContext.new
 		c = d = nil
 		while true
 			c = src.cur_char
 			# This is only an optimization which cuts 50% of the time used.
 			# (but you can't use a-zA-z in exit_on_chars)
 			if c && ((c>=?a && c<=?z) || ((c>=?A && c<=?Z)))
 				con.cur_string << src.shift_char
 				next
 			end
 			break if exit_on_chars && exit_on_chars.include?(c)
 			break if exit_on_strings && exit_on_strings.any? {|x| src.cur_chars_are x}
 			# check if there are extensions
 			if check_span_extensions(src, con)
 				next
 			end
 			case c = src.cur_char	
 			when ?\ # it's space (32)
 				if src.cur_chars_are "  \n"
 					src.ignore_chars(3)
 					con.push_element  md_br()
 					next
 				else
 					src.ignore_char
 					con.push_space 
 				end
 			when ?\n, ?\t 
 				src.ignore_char
 				con.push_space 
 			when ?`
 				read_inline_code(src,con)
 			when ?<
 				# It could be:
 				# 1) HTML "<div ..."
 				# 2) HTML "<!-- ..."
 				# 3) url "<http:// ", "<ftp:// ..."
 				# 4) email "<andrea@... ", "<mailto:andrea@..."
 				# 5) on itself! "a < b	"
 				# 6) Start of <<guillemettes>>
 				case d = src.next_char
 					when ?<;  # guillemettes
 						src.ignore_chars(2)
 						con.push_char ?<
 						con.push_char ?<
 					when ?!; 
 						if src.cur_chars_are '<!--'
 							read_inline_html(src, con)
 						else 
 							con.push_char src.shift_char
 						end
 					when ?? 
 						read_xml_instr_span(src, con) 
 					when ?\ , ?\t 
 						con.push_char src.shift_char
 					else
 						if src.next_matches(/<mailto:/) or
 						   src.next_matches(/<[\w\.]+\@/)
 							read_email_el(src, con)
 						elsif src.next_matches(/<\w+:/)
 							read_url_el(src, con)
 						elsif src.next_matches(/<\w/)
 							#puts "This is HTML: #{src.cur_chars(20)}"
 							read_inline_html(src, con)
 						else 
 							#puts "This is NOT HTML: #{src.cur_chars(20)}"
 							con.push_char src.shift_char
 						end
 				end
 			when ?\\
 				d = src.next_char
 				if d == ?'
 					src.ignore_chars(2)
 					con.push_element md_entity('apos')
 				elsif d == ?"
 					src.ignore_chars(2)
 					con.push_element md_entity('quot')
 				elsif escaped.include? d
 					src.ignore_chars(2)
 					con.push_char d
 				else
 					con.push_char src.shift_char
 				end
 			when ?[
 				if markdown_extra? && src.next_char == ?^
 					read_footnote_ref(src,con)
 				else
 					read_link(src, con)
 				end
 			when ?!
 				if src.next_char == ?[
 					read_image(src, con)
 				else
 					con.push_char src.shift_char
 				end
 			when ?&
 				if m = src.read_regexp(/\&([\w\d]+);/)
 					con.push_element md_entity(m[1])
 				else
 					con.push_char src.shift_char
 				end
 			when ?*
 				if not src.next_char
 					maruku_error "Opening * as last char.", src, con
 					maruku_recover "Threating as literal"
 					con.push_char src.shift_char
 				else
 					follows = src.cur_chars(4)
 					if follows =~ /^\*\*\*[^\s\*]/
 						con.push_element read_emstrong(src,'***')
 					elsif follows  =~ /^\*\*[^\s\*]/
 						con.push_element read_strong(src,'**')
 					elsif follows =~ /^\*[^\s\*]/
 						con.push_element read_em(src,'*')
 					else # * is just a normal char
 						con.push_char src.shift_char
 					end
 				end
 			when ?_
 				if not src.next_char
 					maruku_error "Opening _ as last char", src, con
 					maruku_recover "Threating as literal", src, con
 					con.push_char src.shift_char
 				else
 					follows = src.cur_chars(4)
 					if  follows =~ /^\_\_\_[^\s\_]/
 						con.push_element read_emstrong(src,'___')
 					elsif follows  =~ /^\_\_[^\s\_]/
 						con.push_element read_strong(src,'__')
 					elsif follows =~ /^\_[^\s\_]/
 						con.push_element read_em(src,'_')
 					else # _ is just a normal char
 						con.push_char src.shift_char
 					end
 				end
 			when ?{ # extension
 				src.ignore_char # {
 				interpret_extension(src, con, [?}])
 				src.ignore_char # }
 			when nil
 				maruku_error ("Unclosed span (waiting for %s"+
 				 "#{exit_on_strings.inspect})") % [
 						exit_on_chars ? "#{exit_on_chars.inspect} or" : ""],
 						src,con
 				break
 			else # normal text
 				con.push_char src.shift_char
 			end # end case
 		end # end while true
 		con.push_string_if_present 
 		# Assign IAL to elements
 		merge_ial(con.elements, src, con)
 		# Remove leading space
 		if (s = con.elements.first).kind_of? String
 			if s[0] == ?\ then con.elements[0] = s[1, s.size-1] end
 			con.elements.shift if s.size == 0 
 		end
 		# Remove final spaces
 		if (s = con.elements.last).kind_of? String
 			s.chop! if s[-1] == ?\ 
 			con.elements.pop if s.size == 0 
 		end
 		educated = educate(con.elements)
 		educated
 	end
 	def read_xml_instr_span(src, con) 
 		src.ignore_chars(2) # starting <?
 		# read target <?target code... ?>
 		target = if m = src.read_regexp(/(\w+)/)
 			m[1]
 		else
 			''
 		end
 		delim = "?>"
 		code = 
 			read_simple(src, escaped=[], break_on_chars=[], 
 			break_on_strings=[delim])
 		src.ignore_chars delim.size
 		code = (code || "").strip
 		con.push_element md_xml_instr(target, code)
 	end
 	# Start: cursor on character **after** '{'
 	# End: curson on '}' or EOF
 	def interpret_extension(src, con, break_on_chars)
 		case src.cur_char
 		when ?:
 			src.ignore_char # :
 			extension_meta(src, con, break_on_chars)
 		when ?#, ?.
 			extension_meta(src, con, break_on_chars)
 		else
 			stuff = read_simple(src, escaped=[?}], break_on_chars, [])
 			if stuff =~ /^(\w+\s|[^\w])/
 				extension_id = $1.strip
 				if false
 				else
 					maruku_recover "I don't know what to do with extension '#{extension_id}'\n"+
 						"I will threat this:\n\t{#{stuff}} \n as meta-data.\n", src, con
 					extension_meta(src, con, break_on_chars)
 				end
 			else 
 				maruku_recover "I will threat this:\n\t{#{stuff}} \n as meta-data.\n", src, con
 				extension_meta(src, con, break_on_chars)
 			end
 		end
 	end
 	def extension_meta(src, con, break_on_chars)
 		if m = src.read_regexp(/(\w)+\:/)
 			name = m[1]
 			content = m[2]
 			al = read_attribute_list(src, con, break_on_chars)
 			self.doc.ald[name] = al
 		 	con.push md_ald(name, al)
 		else
 			al = read_attribute_list(src, con, break_on_chars)
 			self.doc.ald[name] = al
 			con.push md_ial(al)
 		end
 	end	
 	def read_url_el(src,con)
 		src.ignore_char # leading <
 		url = read_simple(src, [], [?>])
 		src.ignore_char # closing >
 		con.push_element md_url(url)
 	end
 	def read_email_el(src,con)
 		src.ignore_char # leading <
 		mail = read_simple(src, [], [?>])
 		src.ignore_char # closing >
 		address = mail.gsub(/^mailto:/,'')
 		con.push_element md_email(address)
 	end
 	def read_url(src, break_on)
 		if [?',?"].include? src.cur_char 
 			error 'Invalid char for url', src
 		end
 		url = read_simple(src, [], break_on)
 		if not url # empty url
 			url = ""
 		end
 		if url[0] == ?< && url[-1] == ?>
 			url = url[1, url.size-2]
 		end
 		if url.size == 0 
 			return nil
 		end
 		url
 	end
 	def read_quoted_or_unquoted(src, con, escaped, exit_on_chars)
 		case src.cur_char
 		when ?', ?"
 			read_quoted(src, con)
 		else
 			read_simple(src, escaped, exit_on_chars)
 		end
 	end
 	# Tries to read a quoted value. If stream does not
 	# start with ' or ", returns nil.
 	def read_quoted(src, con)
 		case src.cur_char
 			when ?', ?"
 				quote_char = src.shift_char # opening quote
 				string = read_simple(src, EscapedCharInQuotes, [quote_char])
 				src.ignore_char # closing quote
 				return string
 			else 
 #				puts "Asked to read quote from: #{src.cur_chars(10).inspect}"
 				return nil
 		end
 	end
 	# Reads a simple string (no formatting) until one of break_on_chars, 
 	# while escaping the escaped.
 	# If the string is empty, it returns nil.
 	# Raises on error if the string terminates unexpectedly.
 #	# If eat_delim is true, and if the delim is not the EOF, then the delim
 #	# gets eaten from the stream.
 	def read_simple(src, escaped, exit_on_chars, exit_on_strings=nil)
 		text = ""
 		while true
 #			puts "Reading simple #{text.inspect}"
 			c = src.cur_char
 			if exit_on_chars && exit_on_chars.include?(c)
 #				src.ignore_char if eat_delim
 				break
 			end
 			break if exit_on_strings && 
 				exit_on_strings.any? {|x| src.cur_chars_are x}
 			case c
 			when nil
 				s= "String finished while reading (break on "+
 				"#{exit_on_chars.map{|x|""<<x}.inspect})"+
 				" already read: #{text.inspect}"
 				maruku_error s, src
 				maruku_recover "I boldly continue", src
 				break
 			when ?\\
 				d = src.next_char
 				if escaped.include? d
 					src.ignore_chars(2)
 					text << d
 				else
 					text << src.shift_char
 				end
 			else 
 				text << src.shift_char
 			end
 		end
 #		puts "Read simple #{text.inspect}"
 		text.empty? ? nil : text
 	end
 	def read_em(src, delim)
 		src.ignore_char
 		children = read_span(src, EscapedCharInText, nil, [delim])
 		src.ignore_char
 		md_em(children)
 	end
 	def read_strong(src, delim)
 		src.ignore_chars(2)
 		children = read_span(src, EscapedCharInText, nil, [delim])
 		src.ignore_chars(2)
 		md_strong(children)
 	end
 	def read_emstrong(src, delim)
 		src.ignore_chars(3)
 		children = read_span(src, EscapedCharInText, nil, [delim])
 		src.ignore_chars(3)
 		md_emstrong(children)
 	end
 	SPACE = ?\ # = 32
 #	R_REF_ID = Regexp.compile(/([^\]\s]*)(\s*\])/)
 	R_REF_ID = Regexp.compile(/([^\]\s]*)(\s*\])/)
 	# Reads a bracketed id "[refid]". Consumes also both brackets.
 	def read_ref_id(src, con)
 		src.ignore_char # [
 		src.consume_whitespace
 #		puts "Next: #{src.cur_chars(10).inspect}"
 		if m = src.read_regexp(R_REF_ID) 
 #			puts "Got: #{m[1].inspect} Ignored: #{m[2].inspect}"
 #			puts "Then: #{src.cur_chars(10).inspect}"
 			m[1]
 		else
 			nil
 		end
 	end
 	def read_footnote_ref(src,con)
 		ref = read_ref_id(src,con)
 		con.push_element md_foot_ref(ref)
 	end
 	def read_inline_html(src, con)
 		h = HTMLHelper.new
 		begin
 			# This is our current buffer in the context
 			start = src.current_remaining_buffer
 			h.eat_this start
 			if not h.is_finished?
 				error "inline_html: Malformed:\n "+
 					"#{start.inspect}\n #{h.inspect}",src,con
 			end
 			consumed = start.size - h.rest.size 
 			if consumed > 0
 				con.push_element md_html(h.stuff_you_read)
 				src.ignore_chars(consumed)
 			else
 				puts "HTML helper did not work on #{start.inspect}"
 				con.push_char src.shift_char
 			end
 		rescue Exception => e
 			maruku_error "Bad html: \n" + 
 				add_tabs(e.inspect+e.backtrace.join("\n"),1,'>'),
 				src,con
 			maruku_recover "I will try to continue after bad HTML.", src, con
 			con.push_char src.shift_char
 		end
 	end
 	def read_inline_code(src, con)
 		# Count the number of ticks
 		num_ticks = 0
 		while src.cur_char == ?` 
 			num_ticks += 1
 			src.ignore_char
 		end
 		# We will read until this string
 		end_string = "`"*num_ticks
 		code = 
 			read_simple(src, escaped=[], break_on_chars=[], 
 				break_on_strings=[end_string])
 #		puts "Now I expects #{num_ticks} ticks: #{src.cur_chars(10).inspect}"
 		src.ignore_chars num_ticks
 		# Ignore at most one space
 		if num_ticks > 1 && code[0] == SPACE
 			code = code[1, code.size-1]
 		end
 		# drop last space 
 		if num_ticks > 1 && code[-1] == SPACE
 			code = code[0,code.size-1]
 		end
 #		puts "Read `` code: #{code.inspect}; after: #{src.cur_chars(10).inspect} "
 		con.push_element md_code(code)
 	end
 	def read_link(src, con)
 		# we read the string and see what happens
 		src.ignore_char # opening bracket
 		children = read_span(src, EscapedCharInText, [?]])
 		src.ignore_char # closing bracket
 		# ignore space
 		if src.cur_char == SPACE and 
 			(src.next_char == ?[ or src.next_char == ?( )
 			src.shift_char
 		end
 		case src.cur_char
 		when ?(
 			src.ignore_char # opening (
 			src.consume_whitespace
 			url = read_url(src, [SPACE,?\t,?)])
 			if not url
 				url = '' # no url is ok
 			end
 			src.consume_whitespace
 			title = nil
 			if src.cur_char != ?) # we have a title
 				quote_char = src.cur_char
 				title = read_quoted(src,con)
 				if not title
 					maruku_error 'Must quote title',src,con
 				else
 					# Tries to read a title with quotes: ![a](url "ti"tle")
 					# this is the most ugly thing in Markdown
 					if not src.next_matches(/\s*\)/)
 						# if there is not a closing par ), then read
 						# the rest and guess it's title with quotes
 						rest = read_simple(src, escaped=[], break_on_chars=[?)], 
 							break_on_strings=[])
 						# chop the closing char
 						rest.chop!
 						title << quote_char << rest
 					end
 				end
 			end
 			src.consume_whitespace
 			closing = src.shift_char # closing )
 			if closing != ?)
 				maruku_error 'Unclosed link',src,con
 				maruku_recover "No closing ): I will not create"+
 				" the link for #{children.inspect}", src, con
 				con.push_elements children
 				return
 			end
 			con.push_element md_im_link(children,url, title)
 		when ?[ # link ref
 			ref_id = read_ref_id(src,con)
 			if ref_id
 				con.push_element md_link(children, ref_id)
 			else 
 				maruku_error "Could not read ref_id", src, con
 				maruku_recover "I will not create the link for "+
 					"#{children.inspect}", src, con
 				con.push_elements children
 				return
 			end
 		else # empty [link]
 			con.push_element md_link(children, "")
 		end
 	end # read link
 	def read_image(src, con)
 		src.ignore_chars(2) # opening "!["
 		alt_text = read_span(src, EscapedCharInText, [?]])
 		src.ignore_char # closing bracket
 		# ignore space
 		if src.cur_char == SPACE and 
 			(src.next_char == ?[ or src.next_char == ?( )
 			src.ignore_char
 		end
 		case src.cur_char
 		when ?(
 			src.ignore_char # opening (
 			src.consume_whitespace
 			url = read_url(src, [SPACE,?\t,?)])
 			if not url
 				error "Could not read url from #{src.cur_chars(10).inspect}",
 					src,con
 			end
 			src.consume_whitespace
 			title = nil
 			if src.cur_char != ?) # we have a title
 				quote_char = src.cur_char
 				title = read_quoted(src,con)
 				if not title
 					maruku_error 'Must quote title',src,con
 				else				
 					# Tries to read a title with quotes: ![a](url "ti"tle")
 					# this is the most ugly thing in Markdown
 					if not src.next_matches(/\s*\)/)
 						# if there is not a closing par ), then read
 						# the rest and guess it's title with quotes
 						rest = read_simple(src, escaped=[], break_on_chars=[?)], 
 							break_on_strings=[])
 						# chop the closing char
 						rest.chop!
 						title << quote_char << rest
 					end
 				end
 			end
 			src.consume_whitespace
 			closing = src.shift_char # closing )
 			if closing != ?)
 				error ("Unclosed link: '"<<closing<<"'")+
 					" Read url=#{url.inspect} title=#{title.inspect}",src,con
 			end
 			con.push_element md_im_image(alt_text, url, title)
 		when ?[ # link ref
 			ref_id = read_ref_id(src,con)
 			con.push_element md_image(alt_text, ref_id)
 		else # no stuff
 			con.push_elements children
 		end
 	end # read link
 	class SpanContext 
 		include MaRuKu::Strings
 		# Read elements
 		attr_accessor :elements
 		attr_accessor :cur_string
 		def initialize
 			@elements = []
 			@cur_string = ""
 		end
 		def push_element(e)
 			raise "Only MDElement and String, please. You pushed #{e.class}: #{e.inspect} " if
 			 not (e.kind_of?(String) or e.kind_of?(MDElement))
 			push_string_if_present
 			@elements << e
 			nil
 		end
 		alias push push_element
 		def push_elements(a)
 			for e in a 
 				if e.kind_of? String
 					e.each_byte do |b| push_char b end
 				else
 					push_element e
 				end
 			end
 		end
 		def push_string_if_present
 			if @cur_string.size > 0
 				@elements << @cur_string
 				@cur_string = ""
 			end
 			nil
 		end
 		def push_char(c)
 			@cur_string << c 
 			nil
 		end
 		# push space into current string if
 		# there isn't one
 		def push_space
 			last = @cur_string[@cur_string.size-1]
 			@cur_string << ?\  if last != ?\ 
 		end
 		def describe
 			lines = @elements.map{|x| x.inspect}.join("\n")
 			s = "Elements read in span: \n" +
 			add_tabs(lines,1, ' -')+"\n"
 			if @cur_string.size > 0
 			s += "Current string: \n  #{@cur_string.inspect}\n" 
 			end
 			s
 		end
 	end # SpanContext
 end end end end # module MaRuKu; module In; module Markdown; module SpanLevelParser
--- a/lib/maruku/input/rubypants.rb
+++ b/lib/maruku/input/rubypants.rb
@ -0,0 +1,225 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 #
 # NOTA BENE: 
 #
 # The following algorithm is a rip-off of RubyPants written by 
 # Christian Neukirchen. 
 #
 # RubyPants is a Ruby port of SmartyPants written by John Gruber.
 #
 # This file is distributed under the GPL, which I guess is compatible
 # with the terms of the RubyPants license.
 #
 # -- Andrea Censi
 # = RubyPants -- SmartyPants ported to Ruby
 #
 # Ported by Christian Neukirchen <mailto:chneukirchen@gmail.com>
 #   Copyright (C) 2004 Christian Neukirchen
 #
 # Incooporates ideas, comments and documentation by Chad Miller
 #   Copyright (C) 2004 Chad Miller
 #
 # Original SmartyPants by John Gruber
 #   Copyright (C) 2003 John Gruber
 #
 #
 # = RubyPants -- SmartyPants ported to Ruby
 #
 #
 # [snip]
 #
 # == Authors
 # 
 # John Gruber did all of the hard work of writing this software in
 # Perl for Movable Type and almost all of this useful documentation.
 # Chad Miller ported it to Python to use with Pyblosxom.
 #
 # Christian Neukirchen provided the Ruby port, as a general-purpose
 # library that follows the *Cloth API.
 # 
 #
 # == Copyright and License
 # 
 # === SmartyPants license:
 # 
 # Copyright (c) 2003 John Gruber
 # (http://daringfireball.net)
 # All rights reserved.
 # 
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions
 # are met:
 # 
 # * Redistributions of source code must retain the above copyright
 #   notice, this list of conditions and the following disclaimer.
 # 
 # * Redistributions in binary form must reproduce the above copyright
 #   notice, this list of conditions and the following disclaimer in
 #   the documentation and/or other materials provided with the
 #   distribution.
 # 
 # * Neither the name "SmartyPants" nor the names of its contributors
 #   may be used to endorse or promote products derived from this
 #   software without specific prior written permission.
 # 
 # This software is provided by the copyright holders and contributors
 # "as is" and any express or implied warranties, including, but not
 # limited to, the implied warranties of merchantability and fitness
 # for a particular purpose are disclaimed. In no event shall the
 # copyright owner or contributors be liable for any direct, indirect,
 # incidental, special, exemplary, or consequential damages (including,
 # but not limited to, procurement of substitute goods or services;
 # loss of use, data, or profits; or business interruption) however
 # caused and on any theory of liability, whether in contract, strict
 # liability, or tort (including negligence or otherwise) arising in
 # any way out of the use of this software, even if advised of the
 # possibility of such damage.
 # 
 # === RubyPants license
 # 
 # RubyPants is a derivative work of SmartyPants and smartypants.py.
 # 
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions
 # are met:
 # 
 # * Redistributions of source code must retain the above copyright
 #   notice, this list of conditions and the following disclaimer.
 # 
 # * Redistributions in binary form must reproduce the above copyright
 #   notice, this list of conditions and the following disclaimer in
 #   the documentation and/or other materials provided with the
 #   distribution.
 # 
 # This software is provided by the copyright holders and contributors
 # "as is" and any express or implied warranties, including, but not
 # limited to, the implied warranties of merchantability and fitness
 # for a particular purpose are disclaimed. In no event shall the
 # copyright owner or contributors be liable for any direct, indirect,
 # incidental, special, exemplary, or consequential damages (including,
 # but not limited to, procurement of substitute goods or services;
 # loss of use, data, or profits; or business interruption) however
 # caused and on any theory of liability, whether in contract, strict
 # liability, or tort (including negligence or otherwise) arising in
 # any way out of the use of this software, even if advised of the
 # possibility of such damage.
 # 
 #
 # == Links
 #
 # John Gruber:: http://daringfireball.net
 # SmartyPants:: http://daringfireball.net/projects/smartypants
 #
 # Chad Miller:: http://web.chad.org
 #
 # Christian Neukirchen:: http://kronavita.de/chris
 module MaRuKu; module In; module Markdown; module SpanLevelParser
 	Punct_class = '[!"#\$\%\'()*+,\-.\/:;<=>?\@\[\\\\\]\^_`{|}~]'
 	Close_class = %![^\ \t\r\n\\[\{\(\-]!
 	Rules = [
 		[/---/,   :mdash          ],
 		[/--/,    :ndash          ],
 		['...',   :hellip         ],
 		['. . .', :hellip         ],
 		["``",    :ldquo          ],
 		["''",    :rdquo          ],
 		[/<<\s/,  [:laquo, :nbsp] ],
 		[/\s>>/,  [:nbsp, :raquo] ],
 		[/<</,    :laquo          ],
 		[/>>/,    :raquo          ],
 #		def educate_single_backticks(str)
 #		["`", :lsquo]
 #		["'", :rsquo]
 		# Special case if the very first character is a quote followed by
 		# punctuation at a non-word-break. Close the quotes by brute
 		# force:
 		[/^'(?=#{Punct_class}\B)/, :rsquo],
 		[/^"(?=#{Punct_class}\B)/, :rdquo],
 		# Special case for double sets of quotes, e.g.:
 		#   <p>He said, "'Quoted' words in a larger quote."</p>
 		[/"'(?=\w)/, [:ldquo, :lsquo]    ],
 		[/'"(?=\w)/, [:lsquo, :ldquo]    ],
 		# Special case for decade abbreviations (the '80s):
 		[/'(?=\d\ds)/, :rsquo            ],
 		# Get most opening single quotes:
 		[/(\s)'(?=\w)/, [:one, :lsquo]   ],
 		# Single closing quotes:
 		[/(#{Close_class})'/, [:one, :rsquo]],
 		[/'(\s|s\b|$)/, [:rsquo, :one]],
 		# Any remaining single quotes should be opening ones:
 		[/'/, :lsquo],
 		# Get most opening double quotes:
 		[/(\s)"(?=\w)/, [:one, :ldquo]],
 		# Double closing quotes:
 		[/(#{Close_class})"/, [:one, :rdquo]],
 		[/"(\s|s\b|$)/, [:rdquo, :one]],
 		# Any remaining quotes should be opening ones:
 		[/"/, :ldquo]
 	].
 	map{|reg, subst| # People should do the thinking, machines should do the work.
 		reg = Regexp.new(Regexp.escape(reg)) if not reg.kind_of? Regexp
 		subst = [subst] if not subst.kind_of?Array
 		[reg, subst]}
 # note: input will be destroyed
 def apply_one_rule(reg, subst, input)
 	output = []
 	while first = input.shift
 		if first.kind_of?(String) && (m = reg.match(first))
 			output.push    m. pre_match if m. pre_match.size > 0
 			 input.unshift m.post_match if m.post_match.size > 0
 			subst.reverse.each do |x|
 				input.unshift( x == :one ? m[1] : md_entity(x.to_s) ) end
 		else
 			output.push first
 		end
 	end
 	return output
 end
 def educate(elements)
 	Rules.each do |reg, subst|
 		elements = apply_one_rule(reg, subst, elements)
 	end
 	# strips empty strings
 	elements.delete_if {|x| x.kind_of?(String) && x.size == 0}
 	final = []
 	# join consecutive strings
 	elements.each do |x|
 		if x.kind_of?(String) && final.last.kind_of?(String)
 			final.last << x
 		else
 			final << x
 		end
 	end
 	return final
 end
 end end end end
--- a/lib/maruku/input/type_detection.rb
+++ b/lib/maruku/input/type_detection.rb
@ -0,0 +1,141 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 class String
 	include MaRuKu::Strings
 	def md_type()
 		@md_type ||= line_md_type(self)
 	end
 end
 class NilClass
 	def md_type() nil end
 end
 # This code does the classification of lines for block-level parsing.
 module MaRuKu; module Strings
 	def line_md_type(l)
 		# The order of evaluation is important (:text is a catch-all)
 		return :text   if l =~ /^[a-zA-Z]/
 		return :code             if number_of_leading_spaces(l)>=4
 		return :empty    if l =~ /^\s*$/
 		return :footnote_text    if l =~ FootnoteText
 		return :ref_definition   if l =~ LinkRegex or l=~ IncompleteLink
 		return :abbreviation     if l =~ Abbreviation
 		return :definition       if l =~ Definition
 		# I had a bug with emails and urls at the beginning of the 
 		# line that were mistaken for raw_html
 		return :text     if l=~EMailAddress or l=~ URL
 		# raw html is like PHP Markdown Extra: at most three spaces before
 		return :xml_instr if l =~ %r{^\s*<\?}
 		return :raw_html if l =~ %r{^[ ]?[ ]?[ ]?</?\s*\w+}
 		return :raw_html if l =~ %r{[ ]{0,3}<\!\-\-}
 		return :ulist    if l =~ /^\s?([\*\-\+])\s+.*\w+/
 		return :olist    if l =~ /^\s?\d+\..*\w+/
 		return :header1  if l =~ /^(=)+/ 
 		return :header2  if l =~ /^([-\s])+$/ 
 		return :header3  if l =~ /^(#)+\s*\S+/ 
 		# at least three asterisks on a line, and only whitespace
 		return :hrule    if l =~ /^(\s*\*\s*){3,1000}$/ 
 		return :hrule    if l =~ /^(\s*-\s*){3,1000}$/ # or hyphens
 		return :hrule    if l =~ /^(\s*_\s*){3,1000}$/ # or underscores	
 		return :quote    if l =~ /^>/
 		return :metadata if l =~ /^@/
 #		if @@new_meta_data?
 			return :ald   if l =~ AttributeDefinitionList
 			return :ial   if l =~ InlineAttributeList
 #		end
 #		return :equation_end if l =~ EquationEnd
 		return :text # else, it's just text
 	end
 	# $1 = id   $2 = attribute list
 	AttributeDefinitionList = /^\s{0,3}\{([\w\d\s]+)\}:\s*(.*)\s*$/
 	# 
 	InlineAttributeList = /^\s{0,3}\{(.*)\}\s*$/
 	# Example:
 	#     ^:blah blah
 	#     ^: blah blah
 	#     ^   : blah blah
 	Definition = %r{ 
 		^ # begin of line
 		[ ]{0,3} # up to 3 spaces
 		: # colon
 		\s* # whitespace
 		(\S.*) # the text    = $1
 		$ # end of line
 	}x
 	# Example:
 	#     *[HTML]: Hyper Text Markup Language
 	Abbreviation = %r{
 		^  # begin of line
 		\* # one asterisk
 		\[ # opening bracket
 		([^\]]+) # any non-closing bracket:  id = $1
 		\] # closing bracket
 		:  # colon
 		\s* # whitespace
 		(\S.*\S)* #           definition=$2
 		\s* # strip this whitespace
 		$   # end of line
 	}x
 	FootnoteText = %r{
 		^\s*\[(\^.+)\]: # id = $1 (including '^')
 		\s*(\S.*)?$    # text = $2 (not obb.)
 	}x
 	# This regex is taken from BlueCloth sources
 	# Link defs are in the form: ^[id]: \n? url "optional title"
 	LinkRegex = %r{
 		^[ ]*\[([^\]]+)\]:		# id = $1
 		  [ ]*
 		<?(\S+)>?				# url = $2
 		  [ ]*
 		(?:# Titles are delimited by "quotes" or (parens).
 			["(']
 			(.+?)			# title = $3
 			[")']			# Matching ) or "
 			\s*(.+)?   # stuff = $4
 		)?	# title is optional
 	  }x
 	IncompleteLink = %r{^\s*\[(.+)\]:\s*$}
 	HeaderWithId = /^(.*)\{\#([\w_-]+)\}\s*$/
 	HeaderWithAttributes = /^(.*)\{(.*)\}\s*$/
 	# if contains a pipe, it could be a table header
 	MightBeTableHeader = %r{\|}
 	# -------------:
 	Sep = /\s*(\:)?\s*-+\s*(\:)?\s*/
 	# | -------------:| ------------------------------ |
 	TableSeparator = %r{^(\|?#{Sep}\|?)+\s*$}
 	EMailAddress = /<([^:]+@[^:]+)>/
 	URL = /^<http:/
 end end
--- a/lib/maruku/maruku.rb
+++ b/lib/maruku/maruku.rb
@ -0,0 +1,33 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 # The Maruku class is the public interface
 class Maruku
 	def initialize(s=nil, meta={})
 		super(nil)
 		self.attributes.merge! meta
 		if s
 			parse_doc(s)
 		end
 	end
 end
--- a/lib/maruku/output/to_html.rb
+++ b/lib/maruku/output/to_html.rb
@ -0,0 +1,689 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 require 'rexml/document'
 require 'rubygems'
 require 'syntax'
 require 'syntax/convertors/html'
 class String
 	# A string is rendered into HTML by creating
 	# a REXML::Text node. REXML takes care of all the encoding.
 	def to_html
 		REXML::Text.new(self)
 	end
 end
 class REXML::Element
 	# We only want to output the children in Maruku::to_html
 	 public :write_children 
 end
 # This module groups all functions related to HTML export.
 module MaRuKu; module Out; module HTML
 	include REXML
 	# Render as an HTML fragment (no head, just the content of BODY). (returns a string)
 	def to_html(context={})
 		indent = context[:indent] || -1
 		ie_hack = context[:ie_hack] ||true
 		div = Element.new 'dummy'
 			children_to_html.each do |e|
 				div << e
 			end
 			# render footnotes
 			if @doc.footnotes_order.size > 0
 				div << render_footnotes
 			end
 		doc = Document.new(nil,{:respect_whitespace =>:all})
 		doc << div
 		# REXML Bug? if indent!=-1 whitespace is not respected for 'pre' elements
 		# containing code.
 		xml =""
 		div.write_children(xml,indent,transitive=true,ie_hack)
 		xml
 	end
 	# Render to a complete HTML document (returns a string)
 	def to_html_document(context={})
 		indent = context[:indent] || -1
 		ie_hack = context[:ie_hack] ||true
 		doc = to_html_document_tree
 		xml  = "" 
 		# REXML Bug? if indent!=-1 whitespace is not respected for 'pre' elements
 		# containing code.
 		doc.write(xml,indent,transitive=true,ie_hack);
 		xhtml10strict  = "
 <?xml version='1.0' encoding='utf-8'?>
 <!DOCTYPE html PUBLIC '-//W3C//DTD XHTML 1.0 Strict//EN'
 'http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd'>\n"
 		xhtml11strict_mathml2 = '<?xml version="1.0" encoding="utf-8"?>
 <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1 plus MathML 2.0//EN"
               "http://www.w3.org/TR/MathML2/dtd/xhtml-math11-f.dtd" [
  <!ENTITY mathml "http://www.w3.org/1998/Math/MathML">
 ]>
 '
 xhtml11_mathml2_svg11 = 
 '<?xml version="1.0" encoding="utf-8"?>
 <!DOCTYPE html PUBLIC
    "-//W3C//DTD XHTML 1.1 plus MathML 2.0 plus SVG 1.1//EN"
    "http://www.w3.org/2002/04/xhtml-math-svg/xhtml-math-svg.dtd">
 '
 		xhtml11_mathml2_svg11 + xml
 	end
 	def xml_newline() Text.new("\n") end
 	# Render to a complete HTML document (returns a REXML document tree)
 	def to_html_document_tree
 		doc = Document.new(nil,{:respect_whitespace =>:all})
 	#	doc << XMLDecl.new
 		root = Element.new('html', doc)
 		root.add_namespace('http://www.w3.org/1999/xhtml')
 		root.add_namespace('svg', "http://www.w3.org/2000/svg" )
 		lang = self.attributes[:lang] || 'en'
 		root.attributes['xml:lang'] = lang
 		root << xml_newline
 		head = Element.new 'head', root
 			#<META HTTP-EQUIV="Content-Type" CONTENT="text/html; charset=utf-8">
 			me = Element.new 'meta', head
 			me.attributes['http-equiv'] = 'Content-type'
 #			me.attributes['content'] = 'text/html;charset=utf-8'	
 			me.attributes['content'] = 'application/xhtml+xml;charset=utf-8'	
 			# Create title element
 			doc_title = self.attributes[:title] || self.attributes[:subject] || ""
 			title = Element.new 'title', head
 				title << Text.new(doc_title)
 			if css_list = self.attributes[:css]
 				css_list.split.each do |css|
 				# <link type="text/css" rel="stylesheet" href="..." />
 				link = Element.new 'link'
 				link.attributes['type'] = 'text/css'
 				link.attributes['rel'] = 'stylesheet'
 				link.attributes['href'] = css
 				head << link 
 				head << xml_newline
 				end
 			end
 		root << xml_newline
 		body = Element.new 'body'
 			children_to_html.each do |e|
 				body << e
 			end
 			# render footnotes
 			if @doc.footnotes_order.size > 0
 				body << render_footnotes
 			end
 			# When we are rendering a whole document, we add a signature 
 			# at the bottom. 
 			if get_setting(:maruku_signature)
 				body << maruku_html_signature 
 			end
 		root << body
 		doc
 	end
 	# returns "st","nd","rd" or "th" as appropriate
 	def day_suffix(day)
 		s = {
 			1 => 'st',
 			2 => 'nd',
 			3 => 'rd',
 			21 => 'st',
 			22 => 'nd',
 			23 => 'rd',
 			31 => 'st'
 		}
 		return s[day] || 'th';
 	end
 	# formats a nice date
 	def nice_date
 		t = Time.now
 		t.strftime(" at %H:%M on ")+
 		t.strftime("%A, %B %d")+
 		day_suffix(t.day)+
 		t.strftime(", %Y")
 	end
 	def maruku_html_signature		
 		div = Element.new 'div'
 			div.attributes['class'] = 'maruku_signature'
 			Element.new 'hr', div
 			span = Element.new 'span', div
 				span.attributes['style'] = 'font-size: small; font-style: italic'
 				span << Text.new('Created by ')
 				a = Element.new('a', span)
 					a.attributes['href'] = 'http://maruku.rubyforge.org'
 					a.attributes['title'] = 'Maruku: a Markdown-superset interpreter for Ruby'
 					a << Text.new('Maruku')
 				span << Text.new(nice_date+".")
 		div
 	end
 	def render_footnotes
 		div = Element.new 'div'
 		div.attributes['class'] = 'footnotes'
 		div <<  Element.new('hr')
 			ol = Element.new 'ol'
 			@doc.footnotes_order.each_with_index do |fid, i| num = i+1
 				f = self.footnotes[fid]
 				if f
 					li = f.wrap_as_element('li')
 					li.attributes['id'] = "fn:#{num}"
 					a = Element.new 'a'
 						a.attributes['href'] = "#fnref:#{num}"
 						a.attributes['rev'] = 'footnote'
 						a<< Text.new('&#8617;', true, nil, true)
 					li.insert_after(li.children.last, a)
 					ol << li
 				else
 					maruku_error"Could not find footnote '#{fid}'"
 				end
 			end
 		div << ol
 		div
 	end
 	def to_html_hrule; create_html_element 'hr' end
 	def to_html_linebreak; Element.new 'br' end
 	# renders children as html and wraps into an element of given name
 	# 
 	# Sets 'id' if meta is set
 	def wrap_as_element(name, attributes_to_copy=[])
 		m = create_html_element(name, attributes_to_copy)
 			children_to_html.each do |e| m << e; end
 #			m << Comment.new( "{"+self.al.to_md+"}") if not self.al.empty?
 #			m << Comment.new( @attributes.inspect) if not @attributes.empty?
 		m
 	end
 	StandardAttributes = [:id, :style, :class]
 	def create_html_element(name, attributes_to_copy=[])
 		m = Element.new name
 			(StandardAttributes+attributes_to_copy).each do |a|
 				if v = @attributes[a] then m.attributes[a.to_s] = v.to_s end
 			end
 		m
 	end
 	def to_html_ul
 		if @attributes[:toc]
 			# render toc
 			html_toc = @doc.toc.to_html
 			return html_toc
 		else
 			add_ws  wrap_as_element('ul')               
 		end
 	end
 	def to_html_paragraph; add_ws wrap_as_element('p')                end
 	def to_html_ol;        add_ws wrap_as_element('ol')        end
 	def to_html_li;        add_ws wrap_as_element('li')        end
 	def to_html_li_span;   add_ws wrap_as_element('li')        end
 	def to_html_quote;     add_ws wrap_as_element('blockquote')  end
 	def to_html_strong;    wrap_as_element('strong')           end
 	def to_html_emphasis;  wrap_as_element('em')               end
 	# nil if not applicable, else string
 	def section_number
 		return nil if not @doc.attributes[:use_numbered_headers]
 		n = @attributes[:section_number]
 		if n && (not n.empty?)
 			 n.join('.')+". "
 		else
 			nil
 		end
 	end
 	# nil if not applicable, else SPAN element
 	def render_section_number
 		# if we are bound to a section, add section number
 		if num = section_number
 			span = Element.new 'span'
 			span.attributes['class'] = 'maruku_section_number'
 			span << Text.new(section_number)
 			span
 		else
 			nil
 		end
 	end
 	def to_html_header
 		element_name = "h#{self.level}" 
 		h = wrap_as_element element_name
 		if span = render_section_number
 			h.insert_before(h.children.first, span)
 		end
 		add_ws h
 	end
 	def source2html(source)
 		source = source.gsub(/&/,'&amp;')
 		source = Text.normalize(source)
 		Text.new(source, true, nil, false )
 	end
 =begin maruku_doc
 Attribute: html_use_syntax
 Scope: document
 Output: html
 Summary: Enables the use of the `syntax` package.
 Related: lang, code_lang
 Default: <?mrk Globals[:html_use_syntax].to_s ?>
 If false, Maruku does not append a signature to the
 generated file.
 =end
 	def to_html_code; 
 		source = self.raw_code
 		lang = self.attributes[:lang] || @doc.attributes[:code_lang] 
 		lang = 'xml' if lang=='html'
 		use_syntax = get_setting :html_use_syntax
 		element = 
 		if use_syntax && lang
 			begin
 				convertor = Syntax::Convertors::HTML.for_syntax lang
 				# eliminate trailing newlines otherwise Syntax crashes
 				source = source.gsub(/\n*\Z/,'')
 				html = convertor.convert( source )
 				pre = Document.new(html, {:respect_whitespace =>:all}).root
 				pre.attributes['class'] = lang
 				pre
 			rescue Object => e
 				maruku_error"Error while using the syntax library for code:\n#{source.inspect}"+
 				 "Lang is #{lang} object is: \n"+
 				  self.inspect + 
 				"\nException: #{e.class}: #{e.message}\n\t#{e.backtrace.join("\n\t")}"
 				tell_user("Using normal PRE because the syntax library did not work.")
 				to_html_code_using_pre(source)
 			end
 		else
 			to_html_code_using_pre(source)
 		end
 		color = get_setting(:code_background_color)
 		if color != Globals[:code_background_color]
 			element.attributes['style'] = "background-color: #{color};"
 		end
 		element
 	end
 	def to_html_code_using_pre(source)
 		pre = create_html_element  'pre'
 		code = Element.new 'code', pre
 		s = source
 		s  = s.gsub(/&/,'&amp;')
 		s = Text.normalize(s)
 		s  = s.gsub(/\&apos;/,'&#39;') # IE bug
 		s  = s.gsub(/'/,'&#39;') # IE bug
 		if get_setting(:code_show_spaces) 
 			# 187 = raquo
 			# 160 = nbsp
 			# 172 = not
 			s.gsub!(/\t/,'&#187;'+'&#160;'*3)
 			s.gsub!(/ /,'&#172;')
 		end
 		text = Text.new(s, respect_ws=true, parent=nil, raw=true )
 		code << text
 		pre
 	end
 	def to_html_inline_code; 
 		pre =  create_html_element 'code'
 			source = self.raw_code
 			pre << source2html(source) 
 			color = get_setting(:code_background_color)
 			if color != Globals[:code_background_color]
 				pre.attributes['style'] = "background-color: #{color};"
 			end
 		pre
 	end
 	def to_html_immediate_link
 		a =  create_html_element 'a'
 		url = self.url
 		text = url.gsub(/^mailto:/,'') # don't show mailto
 		a << Text.new(text)
 		a.attributes['href'] = url
 		a
 	end
 	def to_html_link
 		a =  wrap_as_element 'a'
 		id = self.ref_id
 		# if empty, use text
 		if id.size == 0
 			id = children.to_s.downcase
 		end
 		if ref = @doc.refs[id]
 			url = ref[:url]
 			title = ref[:title]
 			a.attributes['href'] = url if url
 			a.attributes['title'] = title if title
 		else
 			maruku_error"Could not find ref_id = #{id.inspect} for #{self.inspect}"
 			tell_user "Not creating a link for ref_id = #{id.inspect}."
 			return wrap_as_element('span')
 		end
 		return a
 	end
 	def to_html_im_link
 		if url = self.url
 			title = self.title
 			a =  wrap_as_element 'a'
 			a.attributes['href'] = url
 			a.attributes['title'] = title if title
 			return a
 		else
 			maruku_error"Could not find url in #{self.inspect}"
 			tell_user "Not creating a link for ref_id = #{id.inspect}."
 			return wrap_as_element('span')
 		end
 	end
 	def add_ws(e)
 		[Text.new("\n"), e, Text.new("\n")]
 	end
 ##### Email address
 	def obfuscate(s)
 		res = ''
 		s.each_byte do |char|
 			res +=  "&#%03d;" % char
 		end
 		res
 	end
 	def to_html_email_address
 		email = self.email
 		a = create_html_element 'a'
 			#a.attributes['href'] = Text.new("mailto:"+obfuscate(email),false,nil,true)
 			#a.attributes.add Attribute.new('href',Text.new(
 			#"mailto:"+obfuscate(email),false,nil,true))
 			# Sorry, for the moment it doesn't work
 			a.attributes['href'] = "mailto:#{email}"
 			a << Text.new(obfuscate(email),false,nil,true)
 		a
 	end
 ##### Images
 	def to_html_image
 		a =  create_html_element 'img'
 		id = self.ref_id
 		if ref = @doc.refs[id]
 			url = ref[:url]
 			title = ref[:title]
 			a.attributes['src'] = url.to_s
 			a.attributes['alt'] = title.to_s
 			[:title, :class, :style].each do |s| 
 				a.attributes[s.to_s] = ref[s] if ref[s]
 			end
 		else
 			maruku_error"Could not find id = #{id.inspect} for\n #{self.inspect}"
 			tell_user "Could not create image with ref_id = #{id.inspect};"+
 				 +" Using SPAN element as replacement."
 				return wrap_as_element('span')
 		end
 		return a
 	end
 	def to_html_im_image
 		if not url = self.url
 			maruku_error"Image with no url: #{self.inspect}"
 			tell_user "Could not create image with ref_id = #{id.inspect};"+
 			 +" Using SPAN element as replacement."
 			return wrap_as_element('span')
 		end
 		title = self.title
 		a =  create_html_element 'img'
 			a.attributes['src'] = url
 			a.attributes['alt'] = title.to_s
 		return a
 	end
 	def to_html_raw_html
 		raw_html = self.raw_html
 		if rexml_doc = @parsed_html
 			root = rexml_doc.root
 			if root.nil?
 				s = "Bug in REXML: root() of Document is nil: \n#{rexml_doc.inspect}\n"+
 				"Raw HTML:\n#{raw_html.inspect}"
 				maruku_error s
 				tell_user 'The REXML version you have has a bug, omitting HTML'
 				div = Element.new 'div'
 				#div << Text.new(s)
 				return div
 			end
 			# copies the @children array (FIXME is it deep?)
 			elements =  root.to_a 
 			return elements
 		else # invalid
 			# Creates red box with offending HTML
 			tell_user "Wrapping bad html in a PRE with class 'markdown-html-error'\n"+
 				add_tabs(raw_html,1,'|')
 			pre = Element.new('pre')
 			pre.attributes['style'] = 'border: solid 3px red; background-color: pink'
 			pre.attributes['class'] = 'markdown-html-error'
 			pre << Text.new("HTML parse error: \n#{raw_html}", true)
 			return pre
 		end
 	end
 	def to_html_abbr
 		abbr = Element.new 'abbr'
 		abbr << Text.new(children[0])
 		abbr.attributes['title'] = self.title if self.title
 		abbr
 	end
 	def to_html_footnote_reference
 		id = self.footnote_id
 		# save the order of used footnotes
 		order = @doc.footnotes_order
 		# take next number
 		order << id
 		num = order.size; 
 		sup = Element.new 'sup'
 		sup.attributes['id'] = "fnref:#{num}"
 			a = Element.new 'a'
 			a << Text.new(num.to_s)
 			a.attributes['href'] = "\#fn:#{num}"
 			a.attributes['rel'] = 'footnote'
 		sup << a
 		sup
 	end
 ## Definition lists ###
 	def to_html_definition_list() add_ws wrap_as_element('dl') end
 	def to_html_definition() children_to_html end
 	def to_html_definition_term() add_ws wrap_as_element('dt') end
 	def to_html_definition_data() add_ws wrap_as_element('dd') end	
 	# FIXME: Ugly code
 	def to_html_table
 		align = self.align
 		num_columns = align.size
 		head = @children.slice(0, num_columns)
 		rows = []
 		i = num_columns
 		while i<@children.size
 			rows << @children.slice(i, num_columns)
 			i += num_columns
 		end
 		table = create_html_element 'table'
 			thead = Element.new 'thead'
 			tr = Element.new 'tr'
 				array_to_html(head).each do |x| tr<<x end
 			thead << tr
 			table << thead
 			tbody = Element.new 'tbody'
 			rows.each do |row|
 				tr = Element.new 'tr'
 					array_to_html(row).each_with_index do |x,i| 
 						x.attributes['style'] ="text-align: #{align[i].to_s};" 
 						tr<<x 
 					end
 				tbody << tr << Text.new("\n")
 			end
 			table << tbody
 		table
 	end
 	def to_html_head_cell; wrap_as_element('th') end
 	def to_html_cell
 		if @attributes[:scope]
 			wrap_as_element('th', [:scope])
 		else
 			wrap_as_element('td')
 		end
 	end
 	def to_html_entity 
 		MaRuKu::Out::Latex.need_entity_table
 		entity_name = self.entity_name
 		if (e = MaRuKu::Out::Latex::ENTITY_TABLE[entity_name]) && e.html_num
 			entity_name = e.html_num
 		end
 		# Fix for Internet Explorer
 		if entity_name == 'apos'
 			entity_name = 39
 		end
 		if entity_name.kind_of? Fixnum
 #			Entity.new(entity_name)
 			Text.new('&#%d;' % [entity_name],  false, nil, true)
 		else
 			Text.new('&%s;' % [entity_name])
 		end
 	end
 	def to_html_xml_instr
 		target = self.target || ''
 		code = self.code || ''
 		REXML::Instruction.new(target, code)
 	end
 	# Convert each child to html
 	def children_to_html
 		array_to_html(@children)
 	end
 	def array_to_html(array)
 		e = []
 		array.each do |c|
 			method = c.kind_of?(MDElement) ? 
 			   "to_html_#{c.node_type}" : "to_html"
 			if not c.respond_to?(method)
 				#raise "Object does not answer to #{method}: #{c.class} #{c.inspect}"
 				next
 			end
 			h =  c.send(method)
 			if h.nil?
 				raise "Nil html created by method  #{method}:\n#{h.inspect}\n"+
 				" for object #{c.inspect[0,300]}"
 			end
 			if h.kind_of?Array
 				e = e + h #h.each do |hh| e << hh end
 			else
 				e << h
 			end
 		end
 		e
 	end
 	def to_html_ref_definition; [] end
 	def to_latex_ref_definition; [] end
 end # HTML
 end # out
 end # MaRuKu
--- a/lib/maruku/output/to_latex.rb
+++ b/lib/maruku/output/to_latex.rb
@ -0,0 +1,538 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 module MaRuKu
 class MDDocument
 	Latex_preamble_enc_cjk = 
 "\\usepackage[C40]{fontenc}
 \\usepackage[cjkjis]{ucs}
 \\usepackage[utf8x]{inputenc}"
 	Latex_preamble_enc_utf8 = 
 "\\usepackage{ucs}
 \\usepackage[utf8x]{inputenc}"
 	def latex_require_package(p)
 		if not self.latex_required_packages.include? p
 			self.latex_required_packages.push p
 		end
 	end
 	# Render as a LaTeX fragment 
 	def to_latex
 		children_to_latex
 	end
 =begin maruku_doc
 Attribute: maruku_signature
 Scope: document
 Output: html, latex
 Summary: Enables Maruku's signature.
 Default: true
 If false, Maruku does not append a signature to the
 generated file.
 =end
 	# Render as a complete LaTeX document 
 	def to_latex_document
 		body = to_latex
 		if get_setting(:maruku_signature)
 			body += render_latex_signature 
 		end
 		required = 
 		self.latex_required_packages.map {|p|
 			"\\usepackage{#{p}}\n"
 		}.join
 =begin maruku_doc
 Attribute: latex_cjk
 Scope:     document
 Output:    latex
 Summary:   Support for CJK characters.
 If the `latex_cjk` attribute is specified, then appropriate headers
 are added to the LaTeX preamble to support Japanese fonts.
 You have to have these fonts installed -- and this can be a pain.
 If `latex_cjk` is specified, this is added to the preamble:
 <?mrk md_codeblock(Maruku::MDDocument::Latex_preamble_enc_cjk) ?>
 while the default is to add this:
 <?mrk md_codeblock(Maruku::MDDocument::Latex_preamble_enc_utf8) ?>
 =end
 		encoding = @doc.attributes[:latex_cjk] ? 
 			Latex_preamble_enc_cjk : Latex_preamble_enc_utf8
 =begin maruku_doc
 Attribute: latex_preamble
 Scope:     document
 Output:    latex
 Summary:   User-defined preamble.
 If the `latex_preamble` attribute is specified, then its value
 will be used as a custom preamble. 
 For example:
 	Title: My document
 	Latex preamble: preamble.tex
 will produce:
 	...
 	\input{preamble.tex}
 	...
 =end
 	user_preamble = (file = @doc.attributes[:latex_preamble]) ?
 		"\\input{#{file}}\n" : ""
 "\\documentclass{article}
 % Packages  required to support encoding
 #{encoding}
 % Packages  required by code
 #{required}
 % Packages  always used
 \\usepackage{hyperref}
 \\usepackage{xspace}
 \\usepackage[usenames,dvipsnames]{color}
 \\usepackage[margin=1in]{geometry}
 \\hypersetup{colorlinks=true,urlcolor=blue}
 #{user_preamble}
 \\begin{document} 
 #{body}
 \\end{document}
 "	
 	end
 	def render_latex_signature
 "\\vfill
 \\hrule
 \\vspace{1.2mm}
 \\begin{tiny}
 Created by \\href{http://maruku.rubyforge.org}{Maruku} #{self.nice_date}.
 \\end{tiny}"
 	end
 end end
 module MaRuKu; module Out; module Latex
 	def to_latex_hrule; "\n\\vspace{.5em} \\hrule \\vspace{.5em}\n" end
 	def to_latex_linebreak; "\\linebreak " end
 	def to_latex_paragraph 
 		children_to_latex+"\n\n"
 	end
 =begin maruku_doc
 Title: Input format for colors
 Output: latex, html
 Related: code_background_color
 Admissible formats:
 	green
 	#abc
 	#aabbcc
 =end
 	# \color[named]{name} 	
 	# \color[rgb]{1,0.2,0.3} 
 	def latex_color(s, command='color')
 		if s =~ /^\#(\w\w)(\w\w)(\w\w)$/
 			r = $1.hex; g = $2.hex; b=$3.hex
 			# convert from 0-255 to 0.0-1.0
 			r = r / 255.0; g = g / 255.0; b = b / 255.0; 
 			"\\#{command}[rgb]{%0.2f,%0.2f,%0.2f}" % [r,g,b]
 		elsif s =~ /^\#(\w)(\w)(\w)$/
 			r = $1.hex; g = $2.hex; b=$3.hex
 			# convert from 0-15 to 0.0-1.0
 			r = r / 15.0; g = g / 15.0; b = b / 15.0; 
 			"\\#{command}[rgb]{%0.2f,%0.2f,%0.2f}" % [r,g,b]
 		else	
 			"\\#{command}{#{s}}"
 		end
 	end
 	def to_latex_code;
 		raw_code = self.raw_code
 =begin maruku_doc
 Attribute: latex_use_listings
 Scope: document
 Output: latex
 Summary: Support for `listings` package.
 Related: code_show_spaces, code_background_color, lang, code_lang
 If the `latex_use_listings` attribute is specified, then 
 code block are rendered using the `listings` package.
 Otherwise, a standard `verbatim` environment is used.
 *	If the `lang` attribute for the code block has been specified,
 	it gets passed to the `listings` package using the `lstset` macro.
 	The default lang for code blocks is specified through 
 	the `code_lang` attribute.
 		\lstset{language=ruby}
 	Please refer to the documentation of the `listings` package for
 	supported languages.
 	If a language is not supported, the `listings` package will emit
 	a warning during the compilation. Just press enter and nothing
 	wrong will happen.
 *	If the `code_show_spaces` is specified, than spaces and tabs will
 	be shown using the macro:
 		\lstset{showspaces=true,showtabs=true}
 *	The background color is given by `code_background_color`.
 =end
 		if @doc.attributes[:latex_use_listings]
 			@doc.latex_require_package('listings')
 			s = "\\lstset{columns=fixed,frame=shadowbox}"
 			if get_setting(:code_show_spaces) 
 				s+= "\\lstset{showspaces=true,showtabs=true}\n"
 			else
 				s+= "\\lstset{showspaces=false,showtabs=false}\n"
 			end
 			color = latex_color get_setting(:code_background_color)
 			s+= "\\lstset{backgroundcolor=#{color}}\n" 
 			s+= "\\lstset{basicstyle=\\ttfamily\\footnotesize}\n" 
 			lang = self.attributes[:lang] || @doc.attributes[:code_lang] || '{}'
 			if lang
 				s += "\\lstset{language=#{lang}}\n"
 			end
 			"#{s}\n\\begin{lstlisting}\n#{raw_code}\n\\end{lstlisting}"
 		else
 			"\\begin{verbatim}#{raw_code}\\end{verbatim}\n"
 		end
 	end
 	TexHeaders = {
 		1=>'section',
 		2=>'subsection',
 		3=>'subsubsection',
 		4=>'paragraph'}
 	def to_latex_header
 		h = TexHeaders[self.level] || 'paragraph'
 		title = children_to_latex
 		if number = section_number
 			title = number + title
 		end
 		if id = self.attributes[:id]
 			# drop '#' at the beginning
 			if id[0,1] == '#' then id = [1,id.size] end
 			%{\\hypertarget{%s}{}\\%s*{{%s}}\\label{%s}\n\n} % [ id, h, title, id ]
 		else
 			%{\\%s*{%s}\n\n} % [ h, title]
 		end
 	end
 	def to_latex_ul;       
 		if self.attributes[:toc]
 			@doc.toc.to_latex
 		else
 			wrap_as_environment('itemize')
 		end
 	end
 	def to_latex_quote;        wrap_as_environment('quote')               end
 	def to_latex_ol;        wrap_as_environment('enumerate')               end
 	def to_latex_li;        
 		"\\item #{children_to_latex}\n"  
 	end
 	def to_latex_li_span;
 		"\\item #{children_to_latex}\n"
 	end
 	def to_latex_strong
 		"\\textbf{#{children_to_latex}}"
 	end
 	def to_latex_emphasis
 		"\\emph{#{children_to_latex}}"
 	end
 	def wrap_as_span(c)
 		"{#{c} #{children_to_latex}}"
 	end
 	def wrap_as_environment(name)
 "\\begin{#{name}}%
 #{children_to_latex}
 \\end{#{name}}\n"	
 	end
 	SAFE_CHARS = Set.new([?\ ] + (?a..?z).to_a + (?A..?Z).to_a)
 	# the ultimate escaping
 	# (is much better than using \verb)
 	def latex_escape(source)
 		s=""; 
 		source.each_byte do |b| 
 			if b == ?\ 
 				s << '~'
 			elsif SAFE_CHARS.include? b
 				s << b
 			else
 				s += "\\char%d" % b 
 			end
 		end
 		s
 	end
 	def to_latex_inline_code; 
 		source = self.raw_code
 		# Convert to printable latex chars 
 		s = latex_escape(source)
 		color = get_setting(:code_background_color)
 		colorspec = latex_color(color, 'colorbox')
 		"#{colorspec}{\\tt #{s}}"
 	end
 	def to_latex_immediate_link
 		a =  create_html_element 'a'
 		url = self.url
 		text = url.gsub(/^mailto:/,'') # don't show mailto
 #			gsub('~','$\sim$')
 		text = latex_escape(text)
 		if url[0,1] == '#'
 			url = url[1,url.size]
 			return "\\hyperlink{#{url}}{#{text}}"
 		else
 			return "\\href{#{url}}{#{text}}"
 		end
 	end
 	def to_latex_im_link
 		url = self.url
 		if url[0,1] == '#'
 			url = url[1,url.size]
 			return "\\hyperlink{#{url}}{#{children_to_latex}}"
 		else
 			return "\\href{#{url}}{#{children_to_latex}}"
 		end
 	end
 	def to_latex_link
 		id = self.ref_id
 		# if empty, use text
 		if id.size == 0
 			id = children.to_s.downcase
 		end
 		ref = @doc.refs[id]
 		if not ref
 			$stderr.puts "Could not find id = '#{id}'"
 			return children_to_latex
 		else
 			url = ref[:url]
 			#title = ref[:title] || 'no title'
 			if url[0,1] == '#'
 				url = url[1,url.size]
 				return "\\hyperlink{#{url}}{#{children_to_latex}}"
 			else
 				return "\\href{#{url}}{#{children_to_latex}}"
 			end
 		end
 	end
 	def to_latex_email_address
 		email = self.email
 		"\\href{mailto:#{email}}{#{latex_escape(email)}}"
 	end
 	def to_latex_table
 		align = self.align
 		num_columns = align.size
 		head = @children.slice(0, num_columns)
 		rows = []
 		i = num_columns
 		while i<@children.size
 			rows << @children.slice(i, num_columns)
 			i+=num_columns
 		end
 		h = {:center=>'c',:left=>'l',:right=>'r'}
 		align_string = align.map{|a| h[a]}.join('|')
 		s = "\\begin{tabular}{#{align_string}}\n"
 			s += array_to_latex(head, '&') + "\\\\" +"\n"
 			s += "\\hline \n"
 			rows.each do |row|
 				s += array_to_latex(row, '&') + "\\\\" +"\n"
 			end
 		s += "\\end{tabular}"
 		# puts table in its own paragraph
 		s += "\n\n"
 		s
 	end
 	def to_latex_head_cell; children_to_latex end
 	def to_latex_cell; children_to_latex end
 	def to_latex_footnote_reference
 		id = self.footnote_id
 		f = @doc.footnotes[id]
 		if f
 			"\\footnote{#{f.children_to_latex.strip}} "
 		else
 			$stderr.puts "Could not find footnote '#{fid}'"
 		end
 	end
 	def to_latex_raw_html
 		#'{\bf Raw HTML removed in latex version }'
 		""
 	end
 	## Definition lists ###
 	def to_latex_definition_list
 		s = "\\begin{description}\n"
 		s += children_to_latex
 		s += "\\end{description}\n"
 		s
 	end
 	def to_latex_definition		
 		terms = self.terms
 		definitions = self.definitions
 		s = ""
 		terms.each do |t|
 			s +="\n\\item[#{t.children_to_latex}] "
 		end
 		definitions.each do |d|
 			s += "#{d.children_to_latex} \n"
 		end
 		s
 	end
 	def to_latex_abbr
 		children_to_latex
 	end
 	def to_latex_image
 		id = self.ref_id
 		ref = @doc.refs[id]
 		if not ref
 			$stderr.puts "Could not find id = '#{id}'"
 			""
 		else
 			url = ref[:url]
 			"{\\bf Images not supported yet (#{latex_escape(url)})}"
 		end
 	end
 	# Convert each child to html
 	def children_to_latex
 		array_to_latex(@children)
 	end
 	def array_to_latex(array, join_char='')
 		e = []
 		array.each do |c|
 			method = c.kind_of?(MDElement) ? 
 			   "to_latex_#{c.node_type}" : "to_latex"
 			if not c.respond_to?(method)
 		#		raise "Object does not answer to #{method}: #{c.class} #{c.inspect[0,100]}"
 				next
 			end
 			h =  c.send(method)
 			if h.nil?
 				raise "Nil html for #{c.inspect} created with method #{method}"
 			end
 			if h.kind_of?Array
 				e = e + h
 			else
 				e << h
 			end
 		end
 		# puts a space after commands if needed
 		e.each_index do |i|
 			if e[i] =~ /\\\w+\s*$/ # command
 				if (s=e[i+1]) && s[0] == ?\ # space
 					e[i]  = e[i] + "\\ "
 				end
 			end
 		end
 		e.join(join_char)
 	end
 end end end # MaRuKu::Out::Latex
--- a/lib/maruku/output/to_latex_entities.rb
+++ b/lib/maruku/output/to_latex_entities.rb
@ -0,0 +1,367 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 require 'rexml/document'
 module MaRuKu; module Out; module Latex
 	include REXML
 	def to_latex_entity 
 		MaRuKu::Out::Latex.need_entity_table
 		entity_name = self.entity_name
 		entity = ENTITY_TABLE[entity_name]
 		if not entity
 			maruku_error "I don't know how to translate entity '#{entity_name}' "+
 			"to LaTeX."
 			return ""
 		end
 		replace = entity.latex_string
 		entity.latex_packages.each do |p|
 			@doc.latex_require_package p
 		end
 		if replace =~ /^\\/
 			replace = replace + " "
 		end
 		if replace
 			return replace
 		else
 			tell_user "Cannot translate entity #{entity_name.inspect} to LaTeX."
 			return entity_name
 		end
 	end
 	class LatexEntity
 		safe_attr_accessor :html_num, Fixnum
 		safe_attr_accessor :html_entity, String
 		safe_attr_accessor :latex_string, String
 		safe_attr_accessor :latex_packages, Array
 	end
 	def Latex.need_entity_table
 		Latex.init_entity_table if ENTITY_TABLE.empty?
 	end
 	# create hash @@entity_to_latex
 	def Latex.init_entity_table
 		$stderr.write "Creating entity table.."
 		$stderr.flush
 		doc = Document.new XML_TABLE
 		doc.elements.each("//char") do |c| 
 			num =  c.attributes['num'].to_i
 			name =  c.attributes['name']
 			package =  c.attributes['package']
 			convert =  c.attributes['convertTo']
 			convert.gsub!(/@DOUBLEQUOT/,'"')
 			convert.gsub!(/@QUOT/,"'")
 			convert.gsub!(/@GT/,">")
 			convert.gsub!(/@LT/,"<")
 			convert.gsub!(/@AMP/,"&")
 			convert.freeze
 			e = LatexEntity.new
 			e.html_num = num
 			e.html_entity = name
 			e.latex_string = convert
 			e.latex_packages = package ? package.split : []
 			ENTITY_TABLE[num] = e
 			ENTITY_TABLE[name] = e
 		end
 		$stderr.puts "..done."
 	end
 	ENTITY_TABLE = {}
 # The following is a conversion chart for html elements, courtesy of 
 # text2html 
 	XML_TABLE ="
 	<chars>
 	  <char num='913' name='Alpha' convertTo='$A$' />
 	  <char num='914' name='Beta' convertTo='$B$' />
 	  <char num='915' name='Gamma' convertTo='$\\Gamma$' />
 	  <char num='916' name='Delta' convertTo='$\\Delta$' />
 	  <char num='917' name='Epsilon' convertTo='$E$' />
 	  <char num='918' name='Zeta' convertTo='$Z$' />
 	  <char num='919' name='Eta' convertTo='$H$' />
 	  <char num='920' name='Theta' convertTo='$\\Theta$' />
 	  <char num='921' name='Iota' convertTo='$I$' />
 	  <char num='922' name='Kappa' convertTo='$K$' />
 	  <char num='923' name='Lambda' convertTo='$\\Lambda$' />
 	  <char num='924' name='Mu' convertTo='$M$' />
 	  <char num='925' name='Nu' convertTo='$N$' />
 	  <char num='926' name='Xi' convertTo='$\\Xi$' />
 	  <char num='927' name='Omicron' convertTo='$O$' />
 	  <char num='928' name='Pi' convertTo='$\\Pi$' />
 	  <char num='929' name='Rho' convertTo='$P$' />
 	  <char num='931' name='Sigma' convertTo='$\\Sigma$' />
 	  <char num='932' name='Tau' convertTo='$T$' />
 	  <char num='933' name='Upsilon' convertTo='$Y$' />
 	  <char num='934' name='Phi' convertTo='$\\Phi$' />
 	  <char num='935' name='Chi' convertTo='$X$' />
 	  <char num='936' name='Psi' convertTo='$\\Psi$' />
 	  <char num='937' name='Omega' convertTo='$\\Omega$' />
 	  <char num='945' name='alpha' convertTo='$\\alpha$' />
 	  <char num='946' name='beta' convertTo='$\\beta$' />
 	  <char num='947' name='gamma' convertTo='$\\gamma$' />
 	  <char num='948' name='delta' convertTo='$\\delta$' />
 	  <char num='949' name='epsilon' convertTo='$\\epsilon$' />
 	  <char num='950' name='zeta' convertTo='$\\zeta$' />
 	  <char num='951' name='eta' convertTo='$\\eta$' />
 	  <char num='952' name='theta' convertTo='$\\theta$' />
 	  <char num='953' name='iota' convertTo='$\\iota$' />
 	  <char num='954' name='kappa' convertTo='$\\kappa$' />
 	  <char num='955' name='lambda' convertTo='$\\lambda$' />
 	  <char num='956' name='mu' convertTo='$\\mu$' />
 	  <char num='957' name='nu' convertTo='$\\nu$' />
 	  <char num='958' name='xi' convertTo='$\\xi$' />
 	  <char num='959' name='omicron' convertTo='$o$' />
 	  <char num='960' name='pi' convertTo='$\\pi$' />
 	  <char num='961' name='rho' convertTo='$\\rho$' />
 	  <char num='963' name='sigma' convertTo='$\\sigma$' />
 	  <char num='964' name='tau' convertTo='$\\tau$' />
 	  <char num='965' name='upsilon' convertTo='$\\upsilon$' />
 	  <char num='966' name='phi' convertTo='$\\phi$' />
 	  <char num='967' name='chi' convertTo='$\\chi$' />
 	  <char num='968' name='psi' convertTo='$\\psi$' />
 	  <char num='969' name='omega' convertTo='$\\omega$' />
 	  <char num='962' name='sigmaf' convertTo='$\\varsigma$' />
 	  <char num='977' name='thetasym' convertTo='$\\vartheta$' />
 	  <char num='982' name='piv' convertTo='$\\varpi$' />
 	  <char num='8230' name='hellip' convertTo='\\ldots' />
 	  <char num='8242' name='prime' convertTo='$\\prime$' />
 	  <char num='8254' name='oline' convertTo='-' />
 	  <char num='8260' name='frasl' convertTo='/' />
 	  <char num='8472' name='weierp' convertTo='$\\wp$' />
 	  <char num='8465' name='image' convertTo='$\\Im$' />
 	  <char num='8476' name='real' convertTo='$\\Re$' />
 	  <char num='8501' name='alefsym' convertTo='$\\aleph$' />
 	  <char num='8226' name='bull' convertTo='$\\bullet$' />
 	  <char num='8482' name='trade' convertTo='$^{\\rm TM}$' /> <!-- \texttrademark -->
 	  <char num='8592' name='larr' convertTo='$\\leftarrow$' />
 	  <char num='8594' name='rarr' convertTo='$\\rightarrow$' />
 	  <char num='8593' name='uarr' convertTo='$\\uparrow$' />
 	  <char num='8595' name='darr' convertTo='$\\downarrow$' />
 	  <char num='8596' name='harr' convertTo='$\\leftrightarrow$' />
 	  <char num='8629' name='crarr' convertTo='$\\hookleftarrow$' />
 	  <char num='8657' name='uArr' convertTo='$\\Uparrow$' />
 	  <char num='8659' name='dArr' convertTo='$\\Downarrow$' />
 	  <char num='8656' name='lArr' convertTo='$\\Leftarrow$' />
 	  <char num='8658' name='rArr' convertTo='$\\Rightarrow$' />
 	  <char num='8660' name='hArr' convertTo='$\\Leftrightarrow$' />
 	  <char num='8704' name='forall' convertTo='$\\forall$' />
 	  <char num='8706' name='part' convertTo='$\\partial$' />
 	  <char num='8707' name='exist' convertTo='$\\exists$' />
 	  <char num='8709' name='empty' convertTo='$\\emptyset$' />
 	  <char num='8711' name='nabla' convertTo='$\\nabla$' />
 	  <char num='8712' name='isin' convertTo='$\\in$' />
 	  <char num='8715' name='ni' convertTo='$\\ni$' />
 	  <char num='8713' name='notin' convertTo='$\\notin$' />
 	  <char num='8721' name='sum' convertTo='$\\sum$' />
 	  <char num='8719' name='prod' convertTo='$\\prod$' />
 	  <char num='8722' name='minus' convertTo='$-$' />
 	  <char num='8727' name='lowast' convertTo='$\\ast$' />
 	  <char num='8730' name='radic' convertTo='$\\surd$' />
 	  <char num='8733' name='prop' convertTo='$\\propto$' />
 	  <char num='8734' name='infin' convertTo='$\\infty$' />
 	  <char num='8736' name='ang' convertTo='$\\angle$' />
 	  <char num='8743' name='and' convertTo='$\\wedge$' />
 	  <char num='8744' name='or' convertTo='$\\vee$' />
 	  <char num='8745' name='cup' convertTo='$\\cup$' />
 	  <char num='8746' name='cap' convertTo='$\\cap$' />
 	  <char num='8747' name='int' convertTo='$\\int$' />
 	  <char num='8756' name='there4' convertTo='$\\therefore$' package='amssymb' /> <!-- only AMS -->
 	  <char num='8764' name='sim' convertTo='$\\sim$' />
 	  <char num='8776' name='asymp' convertTo='$\\approx$' />
 	  <char num='8773' name='cong' convertTo='$\\cong$' />
 	  <char num='8800' name='ne' convertTo='$\\neq$' />
 	  <char num='8801' name='equiv' convertTo='$\\equiv$' />
 	  <char num='8804' name='le' convertTo='$\\leq$' />
 	  <char num='8805' name='ge' convertTo='$\\geq$' />
 	  <char num='8834' name='sub' convertTo='$\\subset$' />
 	  <char num='8835' name='sup' convertTo='$\\supset$' />
 <!--	  <char num='8838' name='sube' convertTo='$\\subseteq$' />-->
 	  <char num='8839' name='supe' convertTo='$\\supseteq$' />
 <!--	  <char num='8836' name='nsub' convertTo='$\\nsubset$'  /> <!-- only AMS -->
 	  <char num='8853' name='oplus' convertTo='$\\oplus$' />
 	  <char num='8855' name='otimes' convertTo='$\\otimes$' />
 	  <char num='8869' name='perp' convertTo='$\\perp$' />
 	  <char num='8901' name='sdot' convertTo='$\\cdot$' />
 	  <char num='8968' name='rceil' convertTo='$\\rceil$' />
 	  <char num='8969' name='lceil' convertTo='$\\lceil$' />
 	  <char num='8970' name='lfloor' convertTo='$\\lfloor$' />
 	  <char num='8971' name='rfloor' convertTo='$\\rfloor$' />
 	  <char num='9001' name='rang' convertTo='$\\rangle$' />
 	  <char num='9002' name='lang' convertTo='$\\langle$' />
 	  <char num='9674' name='loz' convertTo='$\\lozenge$' package='amssymb' /> <!-- only AMS -->
 	  <char num='9824' name='spades' convertTo='$\\spadesuit$' />
 	  <char num='9827' name='clubs' convertTo='$\\clubsuit$' />
 	  <char num='9829' name='hearts' convertTo='$\\heartsuit$' />
 	  <char num='9830' name='diams' convertTo='$\\diamondsuit$' />                                     
 	  <char num='38' name='amp' convertTo='\\@AMP' />    
 <!--	  <char num='34' name='quot' convertTo='\\@DOUBLEQUOT' />  XXX -->
 	<char num='34' name='quot' convertTo='\"' /> 
 	<char num='39' name='apos' convertTo=\"'\" /> 
 	  <char num='169' name='copy' convertTo='\\copyright' />
 	  <char num='60' name='lt' convertTo='$@LT$' />
 	  <char num='62' name='gt' convertTo='$@GT$' />
 	  <char num='338' name='OElig' convertTo='\\OE' />
 	  <char num='339' name='oelig' convertTo='\\oe' />
 	  <char num='352' name='Scaron' convertTo='\\v{S}' />
 	  <char num='353' name='scaron' convertTo='\\v{s}' />
 	  <char num='376' name='Yuml' convertTo='\\\"Y' />
 	  <char num='710' name='circ' convertTo='\\textasciicircum' />
 	  <char num='732' name='tilde' convertTo='\\textasciitilde' />
 	  <char num='8211' name='ndash' convertTo='--' />
 	  <char num='8212' name='mdash' convertTo='---' />
 	  <char num='8216' name='lsquo' convertTo='`' />
 	  <char num='8217' name='rsquo' convertTo=\"'\" /> <!-- XXXX -->
 	  <char num='8220' name='ldquo' convertTo='``' />
 	  <char num='8221' name='rdquo' convertTo=\"''\" /> <!-- XXXX -->
 	  <char num='8224' name='dagger' convertTo='\\dag' />
 	  <char num='8225' name='Dagger' convertTo='\\ddag' />
 	  <char num='8240' name='permil' convertTo='\\permil' package='wasysym' /> <!-- wasysym package -->
 	  <char num='8364' name='euro' convertTo='\\euro' package='eurosym' /> <!-- eurosym package -->
 	  <char num='8249' name='lsaquo' convertTo='\\guilsinglleft' package='aeguill'/>
 	  <char num='8250' name='rsaquo' convertTo='\\guilsinglright' package='aeguill' />
 <!--	  <char num='160' name='nbsp' convertTo='\\nolinebreak' />-->
 	  <char num='160' name='nbsp' convertTo='~' />
 	  <char num='161' name='iexcl' convertTo='\\textexclamdown' />
 	  <char num='163' name='pound' convertTo='\\pounds' />
 	  <char num='164' name='curren' convertTo='\\currency' package='wasysym' /> <!-- wasysym package -->
 	  <char num='165' name='yen' convertTo='\\textyen' package='textcomp'/> <!-- textcomp -->
 	  <char num='166' name='brvbar' convertTo='\\brokenvert' /> <!-- wasysym -->
 	  <char num='167' name='sect' convertTo='\\S' />
 	  <char num='171' name='laquo' convertTo='\\guillemotleft' package='aeguill'/>
 	  <char num='187' name='raquo' convertTo='\\guillemotright' package='aeguill'/>
 	  <char num='174' name='reg' convertTo='\\textregistered' />
 	  <char num='170' name='ordf' convertTo='\\textordfeminine' />
 	  <char num='172' name='not' convertTo='$\\neg$' />
 	<!--  <char num='176' name='deg' convertTo='$\\degree$' /> <!-- mathabx -->
 	  <char num='176' name='deg' convertTo='\\textdegree' package='textcomp'/>
 	  <char num='177' name='plusmn' convertTo='$\\pm$' />
 	  <char num='180' name='acute' convertTo='@QUOT' />
 	  <char num='181' name='micro' convertTo='$\\mu$' />
 	  <char num='182' name='para' convertTo='\\P' />
 	  <char num='183' name='middot' convertTo='$\\cdot$' />
 	  <char num='186' name='ordm' convertTo='\\textordmasculine' />
 	  <char num='162' name='cent' convertTo='\\cent' package='wasysym' /> 
 	  <char num='185' name='sup1' convertTo='$^1$' />
 	  <char num='178' name='sup2' convertTo='$^2$' />
 	  <char num='179' name='sup3' convertTo='$^3$' />
 	  <char num='189' name='frac12' convertTo='$\\frac{1}{2}$' />
 	  <char num='188' name='frac14' convertTo='$\\frac{1}{4}$' />
 	  <char num='190' name='frac34' convertTo='$\\frac{3}{4}$' />
 	  <char num='192' name='Agrave' convertTo='\\`A' />
 	  <char num='193' name='Aacute' convertTo='\\@QUOTA' />
 	  <char num='194' name='Acirc' convertTo='\\^A' />
 	  <char num='195' name='Atilde' convertTo='\\~A' />
 	  <char num='196' name='Auml' convertTo='\\@DOUBLEQUOTA' />
 	  <char num='197' name='Aring' convertTo='\\AA' />
 	  <char num='198' name='AElig' convertTo='\\AE' />
 	  <char num='199' name='Ccedil' convertTo='\\c{C}' />
 	  <char num='200' name='Egrave' convertTo='\\`E' />
 	  <char num='201' name='Eacute' convertTo='\\@QUOTE' />
 	  <char num='202' name='Ecirc' convertTo='\\^E' />
 	  <char num='203' name='Euml' convertTo='\\@DOUBLEQUOTE' />
 	  <char num='204' name='Igrave' convertTo='\\`I' />
 	  <char num='205' name='Iacute' convertTo='\\@QUOTI' />
 	  <char num='206' name='Icirc' convertTo='\\^I' />
 	  <char num='207' name='Iuml' convertTo='\\\"I' />
 	  <char num='208' name='ETH' convertTo='$\\eth$' /> <!-- AMS -->
 	  <char num='209' name='Ntilde' convertTo='\\~N' />    
 	  <char num='210' name='Ograve' convertTo='\\`O' />
 	  <char num='211' name='Oacute' convertTo='\\@QUOT O' />
 	  <char num='212' name='Ocirc' convertTo='\\^O' />
 	  <char num='213' name='Otilde' convertTo='\\~O' />
 	  <char num='214' name='Ouml' convertTo='\\@DOUBLEQUOTO' />
 	  <char num='215' name='times' convertTo='$\\times$' />
 	  <char num='216' name='Oslash' convertTo='\\O' />
 	  <char num='217' name='Ugrave' convertTo='\\`U' />
 	  <char num='218' name='Uacute' convertTo='\\@QUOTU' />
 	  <char num='219' name='Ucirc' convertTo='\\^U' />
 	  <char num='220' name='Uuml' convertTo='\\@DOUBLEQUOTU' />
 	  <char num='221' name='Yacute' convertTo='\\@QUOTY' />
 	  <char num='223' name='szlig' convertTo='\\ss' />
 	  <char num='224' name='agrave' convertTo='\\`a' />
 	  <char num='225' name='aacute' convertTo='\\@QUOTa' />
 	  <char num='226' name='acirc' convertTo='\\^a' />
 	  <char num='227' name='atilde' convertTo='\\~a' />
 	  <char num='228' name='auml' convertTo='\\@DOUBLEQUOTa' />
 	  <char num='229' name='aring' convertTo='\\aa' />
 	  <char num='230' name='aelig' convertTo='\\ae' />
 	  <char num='231' name='ccedil' convertTo='\\c{c}' />
 	  <char num='232' name='egrave' convertTo='\\`e' />
 	  <char num='233' name='eacute' convertTo='\\@QUOTe' />
 	  <char num='234' name='ecirc' convertTo='\\^e' />
 	  <char num='235' name='euml' convertTo='\\@DOUBLEQUOTe' />    
 	  <char num='236' name='igrave' convertTo='\\`i' />
 	  <char num='237' name='iacute' convertTo='\\@QUOTi' />
 	  <char num='238' name='icirc' convertTo='\\^i' />
 	  <char num='239' name='iuml' convertTo='\\@DOUBLEQUOTi' />
 	  <char num='240' name='eth' convertTo='$\\eth$' package='amssymb'/> <!-- -->
 	  <char num='241' name='ntilde' convertTo='\\~n' />
 	  <char num='242' name='ograve' convertTo='\\`o' />
 	  <char num='243' name='oacute' convertTo='\\@QUOTo' />
 	  <char num='244' name='ocirc' convertTo='\\^o' />
 	  <char num='245' name='otilde' convertTo='\\~o' />
 	  <char num='246' name='ouml' convertTo='\\@DOUBLEQUOTo' />
 <!--   <char num='247' name='divide' convertTo='$\\divide$' />       -->
 	  <char num='248' name='oslash' convertTo='\\o' /> 
 	  <char num='249' name='ugrave' convertTo='\\`u' />
 	  <char num='250' name='uacute' convertTo='\\@QUOTu' />
 	  <char num='251' name='ucirc' convertTo='\\^u' />
 	  <char num='252' name='uuml' convertTo='\\@DOUBLEQUOTu' />
 	  <char num='253' name='yacute' convertTo='\\@QUOTy' />
 	  <char num='255' name='yuml' convertTo='\\@DOUBLEQUOTy' />                  
 		<char num='222' name='THORN' convertTo='\\Thorn' package='wasysym' /> 
 		<char num='254' name='thorn' convertTo='\\thorn' package='wasysym' />
 	</chars>"
 end end end
--- a/lib/maruku/output/to_latex_strings.rb
+++ b/lib/maruku/output/to_latex_strings.rb
@ -0,0 +1,64 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 class String
 	# These are TeX's special characters
 	LATEX_ADD_SLASH = [ ?{, ?}, ?$, ?&, ?#, ?_, ?%]
 	# These, we transform to {\tt \char<ascii code>}
 	LATEX_TO_CHARCODE = [ ?^, ?~, ?>,?<]
 	def escape_to_latex(s)
 		s2 = ""
 		s.each_byte do |b|
 			if LATEX_TO_CHARCODE.include? b
 				s2 += "{\\tt \\char#{b}}" 
 			elsif LATEX_ADD_SLASH.include? b
 				s2 << ?\\ << b
 			elsif b == ?\\
 			# there is no backslash in cmr10 fonts
 				s2 += "$\\backslash$"
 			else
 				s2 << b
 			end
 		end
 		s2
 	end
 	# escapes special characters
 	def to_latex
 		s = escape_to_latex(self)
 		OtherGoodies.each do |k, v|
 			s.gsub!(k, v)
 		end
 		s
 	end
 	# other things that are good on the eyes
 	OtherGoodies = {
 		/(\s)LaTeX/ => '\1\\LaTeX\\xspace ', # XXX not if already \LaTeX
 #		'HTML' => '\\textsc{html}\\xspace ',
 #		'PDF' => '\\textsc{pdf}\\xspace '
 	}
 end
--- a/lib/maruku/output/to_markdown.rb
+++ b/lib/maruku/output/to_markdown.rb
@ -0,0 +1,164 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 class String
 	# XXX: markdown escaping
 	def to_md(c=nil)
 		to_s
 	end
 	# " andrea censi " => [" andrea ", "censi "]
 	def mysplit
 		split.map{|x| x+" "}
 	end
 end
 module MaRuKu; module Out; module Markdown 
 	DefaultLineLength = 40
 	def to_md(context={})
 		children_to_md(context)
 	end
 	def to_md_paragraph(context)
 		line_length = context[:line_length] || DefaultLineLength
 		wrap(@children, line_length, context)+"\n"
 	end
 	def to_md_li_span(context)
 		len = (context[:line_length] || DefaultLineLength) - 2
 		s = add_tabs(wrap(@children, len-2, context), 1, '  ')
 		s[0] = ?*
 		s + "\n"
 	end
 	def to_md_abbr_def(context)
 		"*[#{self.abbr}]: #{self.text}\n"
 	end
 	def to_md_ol(context)
 		len = (context[:line_length] || DefaultLineLength) - 2
 		md = ""
 		self.children.each_with_index do |li, i|
 			s = add_tabs(w=wrap(li.children, len-2, context), 1, '    ')+"\n"
 			s[0,4] = "#{i+1}.  "[0,4]
 #			puts w.inspect
 			md += s
 		end
 		md + "\n"
 	end
 	def to_md_ul(context)
 		len = (context[:line_length] || DefaultLineLength) - 2
 		md = ""
 		self.children.each_with_index do |li, i|
 			w = wrap(li.children, len-2, context)
 #			puts "W: "+ w.inspect
 			s = add_indent(w)
 #			puts "S: " +s.inspect
 			s[0,1] = "-"
 			md += s
 		end
 		md + "\n"
 	end
 	def add_indent(s,char="    ")
 		t = s.split("\n").map{|x| char+x }.join("\n")
 		s << ?\n if t[-1] == ?\n
 		s
 	end
 	# Convert each child to html
 	def children_to_md(context)
 		array_to_md(@children, context)
 	end
 	def wrap(array, line_length, context)
 		out = ""
 		line = ""
 		array.each do |c|
 			if c.kind_of?(MDElement) &&  c.node_type == :linebreak
 				out << line.strip << "  \n"; line="";
 				next
 			end
 			pieces =
 			if c.kind_of? String
 				c.to_md.mysplit
 			else
 				[c.to_md(context)].flatten
 			end
 	#			puts "Pieces: #{pieces.inspect}"
 			pieces.each do |p|
 				if p.size + line.size > line_length
 					out << line.strip << "\n"; 
 					line = ""
 				end
 				line << p
 			end
 		end
 		out << line.strip << "\n" if line.size > 0
 		out << ?\n if not out[-1] == ?\n
 		out
 	end
 	def array_to_md(array, context, join_char='')
 		e = []
 		array.each do |c|
 			method = c.kind_of?(MDElement) ? 
 			   "to_md_#{c.node_type}" : "to_md"
 			if not c.respond_to?(method)
 				#raise "Object does not answer to #{method}: #{c.class} #{c.inspect[0,100]}"
 #				tell_user "Using default for #{c.node_type}"
 				method = 'to_md'
 			end
 #			puts "#{c.inspect} created with method #{method}"
 			h =  c.send(method, context)
 			if h.nil?
 				raise "Nil md for #{c.inspect} created with method #{method}"
 			end
 			if h.kind_of?Array
 				e = e + h
 			else
 				e << h
 			end
 		end
 		e.join(join_char)
 	end
 end end end
 module MaRuKu; class MDDocument
 	alias old_md to_md
 	def to_md(context={})
 		s = old_md(context)
 #		puts s
 		s
 	end	
 end end
--- a/lib/maruku/output/to_s.rb
+++ b/lib/maruku/output/to_s.rb
@ -0,0 +1,53 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 module MaRuKu
 class MDElement
 	# Strips all formatting from the string
 	def to_s
 		 children_to_s
 	end
 	def children_to_s
 		@children.join
 	end
 	# Generate an id for headers. Assumes @children is set.
 	def generate_id
 		title = children_to_s
 		title.gsub!(/ /,'_')
 		title.downcase!
 		title.gsub!(/[^\w_]/,'')
 		title.strip!
 		if title.size == 0
 			$uid ||= 0
 			$uid += 1
 			title = "id#{$uid}"
 		end
 		title
 	end
 end
 end
--- a/lib/maruku/string_utils.rb
+++ b/lib/maruku/string_utils.rb
@ -0,0 +1,184 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 # Boring stuff with strings.
 module MaRuKu; module Strings
 	def add_tabs(s,n=1,char="\t")
 		s.split("\n").map{|x| char*n+x }.join("\n")
 	end
 	TabSize = 4;
 	def split_lines(s)
 		s.split("\n")
 	end
 	# This parses email headers. Returns an hash. 
 	#
 	# +hash['data']+ is the message.
 	#
 	# Keys are downcased, space becomes underscore, converted to symbols.
 	#
 	#     My key: true
 	#
 	# becomes:
 	#
 	#     {:my_key => true}
 	#
 	def parse_email_headers(s)
 		keys={}
 		match = (s =~ /((\w[\w\s]+: .*\n)+)\n/)
 		if match != 0
 			keys[:data] = s
 		else
 			keys[:data] = $'
 			headers = $1
 			headers.split("\n").each do |l| 
 				k, v = l.split(':')
 				k, v = normalize_key_and_value(k, v)
 				k = k.to_sym
 #				puts "K = #{k}, V=#{v}"
 				keys[k] = v
 			end
 		end
 		keys
 	end
 	# Keys are downcased, space becomes underscore, converted to symbols.
 	def normalize_key_and_value(k,v)
 		v = v ? v.strip : true # no value defaults to true
 		k = k.strip
 		# check synonyms
 		v = true if ['yes','true'].include?(v.to_s.downcase)
 		v = false if ['no','false'].include?(v.to_s.downcase)
 		k = k.downcase.gsub(' ','_')
 		return k, v
 	end
 	# Returns the number of leading spaces, considering that
 	# a tab counts as `TabSize` spaces.
 	def number_of_leading_spaces(s)
 		n=0; i=0;
 		while i < s.size 
 			c = s[i,1]
 			if c == ' '
 				i+=1; n+=1;
 			elsif c == "\t"
 				i+=1; n+=TabSize;
 			else
 				break
 			end
 		end
 		n
 	end
 	# This returns the position of the first real char in a list item
 	#
 	# For example: 
 	#     '*Hello' # => 1
 	#     '* Hello' # => 2
 	#     ' * Hello' # => 3
 	#     ' *   Hello' # => 5
 	#     '1.Hello' # => 2
 	#     ' 1.  Hello' # => 5
 	def spaces_before_first_char(s)
 		case s.md_type
 		when :ulist
 			i=0;
 			# skip whitespace if present
 			while s[i,1] =~ /\s/; i+=1 end
 			# skip indicator (+, -, *)
 			i+=1
 			# skip optional whitespace
 			while s[i,1] =~ /\s/; i+=1 end
 			return i
 		when :olist
 			i=0;
 			# skip whitespace
 			while s[i,1] =~ /\s/; i+=1 end
 			# skip digits
 			while s[i,1] =~ /\d/; i+=1 end
 			# skip dot
 			i+=1
 			# skip whitespace
 			while s[i,1] =~ /\s/; i+=1 end
 			return i
 		else
 			tell_user "BUG (my bad): '#{s}' is not a list"
 			0
 		end
 	end
 	# Counts the number of leading '#' in the string
 	def num_leading_hashes(s)
 		i=0;
 		while i<(s.size-1) && (s[i,1]=='#'); i+=1 end
 		i	
 	end
 	# Strips initial and final hashes
 	def strip_hashes(s)
 		s = s[num_leading_hashes(s), s.size]
 		i = s.size-1
 		while i > 0 && (s[i,1] =~ /(#|\s)/); i-=1; end
 		s[0, i+1].strip
 	end
 	# removes initial quote
 	def unquote(s)
 		s.gsub(/^>\s?/,'')
 	end
 	# toglie al massimo n caratteri
 	def strip_indent(s, n) 
 		i = 0
 		while i < s.size && n>0
 			c = s[i,1]
 			if c == ' '
 				n-=1;
 			elsif c == "\t"
 				n-=TabSize;
 			else
 				break
 			end
 			i+=1
 		end
 		s[i, s.size-1]
 	end
 	def dbg_describe_ary(a, prefix='')
 		i = 0 
 		a.each do |l|
 			puts "#{prefix} (#{i+=1})# #{l.inspect}"
 		end
 	end
 	def force_linebreak?(l)
 		l =~ /  $/
 	end
 end
 end
--- a/lib/maruku/structures.rb
+++ b/lib/maruku/structures.rb
@ -0,0 +1,165 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 class Module
 	def safe_attr_accessor1(symbol, klass)
 		attr_reader symbol
 		code = <<-EOF
 		def #{symbol}=(val)  
 			if not val.kind_of? #{klass}
 				s = "\nCould not assign an object of type \#{val.class} to #{symbol}.\n\n"
 				s += "Tried to assign object of class \#{val.class}:\n"+
 				     "\#{val.inspect}\n"+
 				     "to \#{self.class}::#{symbol} constrained to be of class #{klass}.\n"
 				raise s
 			end
 			@#{symbol} = val
 		end
 EOF
 		module_eval code
  end
 	def safe_attr_accessor2(symbol, klass)
 		attr_accessor symbol
 	end
 	alias  safe_attr_accessor  safe_attr_accessor2
 end
 module MaRuKu
 # I did not want to have a class for each possible element. 
 # Instead I opted to have only the class "MDElement"
 # that represents eveything in the document (paragraphs, headers, etc).
 #
 # You can tell what it is by the variable `node_type`. 
 #
 # In the instance-variable `children` there are the children. These
 # can be of class 1) String or 2) MDElement. 
 #
 # The @doc variable points to the document to which the MDElement
 # belongs (which is an instance of Maruku, subclass of MDElement).
 #
 # Attributes are contained in the hash `attributes`. 
 # Keys are symbols (downcased, with spaces substituted by underscores)
 #
 # For example, if you write in the source document.
 # 
 #     Title: test document
 #     My property: value
 #     
 #     content content
 #
 # You can access `value` by writing:
 #
 #     @doc.attributes[:my_property] # => 'value'
 #
 # from whichever MDElement in the hierarchy.
 #
 class MDElement 
 	# See helpers.rb for the list of allowed #node_type values
 	safe_attr_accessor :node_type, Symbol
 	# Children are either Strings or MDElement
 	safe_attr_accessor :children, Array
 	# An attribute list, may not be nil
 	safe_attr_accessor :al, Array #Maruku::AttributeList
 	# These are the processed attributes
 	safe_attr_accessor :attributes, Hash
 	# Reference of the document (which is of class Maruku)
 	attr_accessor :doc
 	def initialize(node_type=:unset, children=[], meta={}, 
 			al=MaRuKu::AttributeList.new )
 		super(); 
 		self.children = children
 		self.node_type = node_type
 		@attributes = {}
 		meta.each do |symbol, value|
 			self.instance_eval "
 			  def #{symbol}; @#{symbol}; end
 			  def #{symbol}=(val); @#{symbol}=val; end"
 			self.send "#{symbol}=", value
 		end
 		self.al = al || AttributeList.new
 		self.meta_priv = meta
 	end
 	attr_accessor :meta_priv
 	def ==(o)
 		ok = o.kind_of?(MDElement) &&
 		(self.node_type == o.node_type) &&
 		(self.meta_priv == o.meta_priv) &&
 		(self.children == o.children)
 		if not ok
 #			puts "This:\n"+self.inspect+"\nis different from\n"+o.inspect+"\n\n"
 		end
 		ok
 	end
 end
 # This represents the whole document and holds global data.
 class MDDocument
 	safe_attr_accessor :refs, Hash
 	safe_attr_accessor :footnotes, Hash
 	# This is an hash. The key might be nil.
 	safe_attr_accessor :abbreviations, Hash
 	# Attribute lists definition
 	safe_attr_accessor :ald, Hash
 	# The order in which footnotes are used. Contains the id.
 	safe_attr_accessor :footnotes_order, Array
 	safe_attr_accessor :latex_required_packages, Array
 	def initialize(s=nil)
 		super(:document)
 		@doc       = self
 		self.refs = {}
 		self.footnotes = {}
 		self.footnotes_order = []
 		self.abbreviations = {}
 		self.ald = {}
 		self.latex_required_packages = []
 		parse_doc(s) if s 
 	end
 end
 end # MaRuKu
--- a/lib/maruku/structures_inspect.rb
+++ b/lib/maruku/structures_inspect.rb
@ -0,0 +1,87 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 class String
 	def inspect_more(a=nil,b=nil)
 		inspect
 	end
 end
 class Object
 	def inspect_more(a=nil,b=nil)
 		inspect
 	end
 end
 class Array
 	def inspect_more(compact, join_string, add_brackets=true)
 		s  = map {|x| 
 			x.kind_of?(String) ? x.inspect : 
 			x.kind_of?(MaRuKu::MDElement) ? x.inspect(compact) : 
 			(raise "WTF #{x.class} #{x.inspect}")
 		}.join(join_string)
 		add_brackets ? "[#{s}]" : s
 	end
 end
 class Hash
 	def inspect_ordered(a=nil,b=nil)
 		"{"+keys.map{|x|x.to_s}.sort.map{|x|x.to_sym}.
 		map{|k| k.inspect + "=>"+self[k].inspect}.join(',')+"}"
 	end
 end
 module MaRuKu
 class MDElement	
 	def inspect(compact=true)
 		if compact
 			i2 = inspect2
 			return i2 if i2
 		end
 		"md_el(:%s,%s,%s,%s)" %
 		[
 			self.node_type,
 			children_inspect(compact), 
 			@meta_priv.inspect_ordered,
 			self.al.inspect
 		]
 	end
 	def children_inspect(compact=true)
 		s = @children.inspect_more(compact,', ')
 		if @children.empty?
 			"[]"
 		elsif s.size < 70
 			s
 		else
 			"[\n"+
 			add_tabs(@children.inspect_more(compact,",\n",false))+
 			"\n]"
 		end
 	end
 end
 end
--- a/lib/maruku/structures_iterators.rb
+++ b/lib/maruku/structures_iterators.rb
@ -0,0 +1,61 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 module MaRuKu
 class MDElement
 	# Yields to each element of specified node_type
 	# All elements if e_node_type is nil.
 	def each_element(e_node_type=nil, &block) 
 		@children.each do |c| 
 			if c.kind_of? MDElement
 				if (not e_node_type) || (e_node_type == c.node_type)
 					block.call c
 				end
 				c.each_element(e_node_type, &block)
 			end
 		end
 	end
 	# Apply passed block to each String in the hierarchy.
 	def replace_each_string(&block)
 		for c in @children
 			if c.kind_of? MDElement
 				c.replace_each_string(&block)
 			end
 		end
 		processed = []
 		until @children.empty?
 			c = @children.shift
 			if c.kind_of? String
 				result = block.call(c)
 				[*result].each do |e| processed << e end
 			else
 				processed << c
 			end
 		end
 		@children = processed
 	end
 end
 end
--- a/lib/maruku/tests/benchmark.rb
+++ b/lib/maruku/tests/benchmark.rb
@ -0,0 +1,82 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 require 'maruku'
 require 'bluecloth'
 data = $stdin.read
 num = 10
 if ARGV.size > 0 && ((n=ARGV[0].to_i) != 0)
 	num = n
 end
 methods = 
 [
 	[Maruku,    :to_html],
 	[BlueCloth, :to_html],
 	[Maruku,    :to_latex]
 ]
 #methods = [[Maruku, :class]]
 #num = 10
 stats = 
 methods .map do |c, method|
 	puts "Computing for #{c}"
 	start = Time.now
 	doc = nil
 	for i in 1..num
 		$stdout.write "#{i} "; $stdout.flush
 		doc = c.new(data)
 	end
 	stop = Time.now
 	parsing = (stop-start)/num
 	start = Time.now
 	for i in 1..num
 		$stdout.write "#{i} "; $stdout.flush
 		s = doc.send method
 	end
 	stop = Time.now
 	rendering = (stop-start)/num
 	puts ("%s (%s): parsing %0.2f sec + rendering %0.2f sec "+
 	"= %0.2f sec ") % [c, method, parsing,rendering,parsing+rendering]
 	[c, method, parsing, rendering]
 end
 puts "\n\n\n"
 stats.each do |x| x.push(x[2]+x[3]) end
 max = stats.map{|x|x[4]}.max
 stats.sort! { |x,y| x[4] <=> y[4] } . reverse!
 for c, method, parsing, rendering, tot in stats
 	puts ("%20s: parsing %0.2f sec + rendering %0.2f sec "+
 	"= %0.2f sec   (%0.2fx)") % 
 	["#{c} (#{method})", parsing,rendering,tot,max/tot]
 end
--- a/lib/maruku/tests/new_parser.rb
+++ b/lib/maruku/tests/new_parser.rb
@ -0,0 +1,359 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 require 'maruku'
 module MaRuKu; module Tests
 	# 5 accented letters in italian, encoded as UTF-8
 	AccIta8 = "\303\240\303\250\303\254\303\262\303\271"
 	# Same letters, written in ISO-8859-1 (one byte per letter)
 	AccIta1 = "\340\350\354\362\371"
 	# The word MA-RU-KU, written in katakana using UTF-8
 	Maruku8 = "\343\203\236\343\203\253\343\202\257"
 	def test_span_parser(verbose, break_on_first_error, quiet)
 	good_cases = [
 		["",       [],         'Empty string gives empty list'],
 		["a",      ["a"],      'Easy char'],
 		[" a",     ["a"],      'First space in the paragraph is ignored'],
 		["a\n \n", ["a"],      'Last spaces in the paragraphs are ignored'],
 		[' ',      [],      'One char => nothing'],
 		['  ',     [],      'Two chars => nothing'],
 		['a  b',   ['a b'],    'Spaces are compressed'],
 		['a  b',   ['a b'],    'Newlines are spaces'],
 		["a\nb",   ['a b'],    'Newlines are spaces'],
 		["a\n b",  ['a b'],    'Compress newlines 1'],
 		["a \nb",  ['a b'],    'Compress newlines 2'],
 		[" \nb",   ['b'],      'Compress newlines 3'],
 		["\nb",    ['b'],      'Compress newlines 4'],
 		["b\n",    ['b'],     'Compress newlines 5'],
 		["\n",     [],      'Compress newlines 6'],
 		["\n\n\n", [],      'Compress newlines 7'],
 		[nil, :throw, "Should throw on nil input"],
 		# Code blocks
 		["`" ,   :throw,  'Unclosed single ticks'],
 		["``" ,  :throw,  'Unclosed double ticks'],
 		["`a`" ,     [md_code('a')],    'Simple inline code'],
 		["`` ` ``" ,    [md_code('`')],   ],
 		["`` \\` ``" ,    [md_code('\\`')],   ],
 		["``a``" ,   [md_code('a')],    ],
 		["`` a ``" ,   [md_code('a')],    ],
 		# Newlines 
 		["a  \n", ['a',md_el(:linebreak)], 'Two spaces give br.'],
 		["a \n",  ['a'], 'Newlines 2'],
 		["  \n",  [md_el(:linebreak)], 'Newlines 3'],
 		["  \n  \n",  [md_el(:linebreak),md_el(:linebreak)],'Newlines 3'],
 		["  \na  \n",  [md_el(:linebreak),'a',md_el(:linebreak)],'Newlines 3'],
 		# Inline HTML
 		["a < b", ['a < b'], '< can be on itself'],
 		["<hr>",  [md_html('<hr />')], 'HR will be sanitized'],
 		["<hr/>", [md_html('<hr />')], 'Closed tag is ok'],
 		["<hr  />", [md_html('<hr />')], 'Closed tag is ok 2'],
 		["<hr/>a", [md_html('<hr />'),'a'], 'Closed tag is ok 2'],
 		["<em></em>a", [md_html('<em></em>'),'a'], 'Inline HTML 1'],
 		["<em>e</em>a", [md_html('<em>e</em>'),'a'], 'Inline HTML 2'],
 		["a<em>e</em>b", ['a',md_html('<em>e</em>'),'b'], 'Inline HTML 3'],
 		["<em>e</em>a<em>f</em>", 
 			[md_html('<em>e</em>'),'a',md_html('<em>f</em>')], 
 			'Inline HTML 4'],
 		["<em>e</em><em>f</em>a", 
 			[md_html('<em>e</em>'),md_html('<em>f</em>'),'a'], 
 			'Inline HTML 5'],
 			["<img src='a' />", [md_html("<img src='a' />")], 'Attributes'],
 			["<img src='a'/>"],
 		# emphasis
 		["**", :throw, 'Unclosed double **'],
 		["\\*", ['*'], 'Escaping of *'],
 		["a *b* ", ['a ', md_em('b')], 'Emphasis 1'],
 		["a *b*", ['a ', md_em('b')], 'Emphasis 2'],
 		["a * b", ['a * b'], 'Emphasis 3'],
 		["a * b*", :throw, 'Unclosed emphasis'],
 		# same with underscore
 		["__", :throw, 'Unclosed double __'],
 		["\\_", ['_'], 'Escaping of _'],
 		["a _b_ ", ['a ', md_em('b')], 'Emphasis 4'],
 		["a _b_", ['a ', md_em('b')], 'Emphasis 5'],
 		["a _ b", ['a _ b'], 'Emphasis 6'],
 		["a _ b_", :throw, 'Unclosed emphasis'],
 		["_b_", [md_em('b')], 'Emphasis 7'],
 		["_b_ _c_", [md_em('b'),' ',md_em('c')], 'Emphasis 8'],
 		["_b__c_", [md_em('b'),md_em('c')], 'Emphasis 9'],
 		# strong
 		["**a*", :throw, 'Unclosed double ** 2'],
 		["\\**a*", ['*', md_em('a')], 'Escaping of *'],
 		["a **b** ", ['a ', md_strong('b')], 'Emphasis 1'],
 		["a **b**", ['a ', md_strong('b')], 'Emphasis 2'],
 		["a ** b", ['a ** b'], 'Emphasis 3'],
 		["a ** b**", :throw, 'Unclosed emphasis'],
 		["**b****c**", [md_strong('b'),md_strong('c')], 'Emphasis 9'],
 		# strong (with underscore)
 		["__a_", :throw, 'Unclosed double __ 2'],
 		["\\__a_", ['_', md_em('a')], 'Escaping of _'],
 		["a __b__ ", ['a ', md_strong('b')], 'Emphasis 1'],
 		["a __b__", ['a ', md_strong('b')], 'Emphasis 2'],
 		["a __ b", ['a __ b'], 'Emphasis 3'],
 		["a __ b__", :throw, 'Unclosed emphasis'],
 		["__b____c__", [md_strong('b'),md_strong('c')], 'Emphasis 9'],
 		# extra strong
 		["***a**", :throw, 'Unclosed triple *** '],
 		["\\***a**", ['*', md_strong('a')], 'Escaping of *'],
 		["a ***b*** ", ['a ', md_emstrong('b')], 'Strong elements'],
 		["a ***b***", ['a ', md_emstrong('b')]],
 		["a *** b", ['a *** b']],
 		["a ** * b", ['a ** * b']],
 		["***b******c***", [md_emstrong('b'),md_emstrong('c')]],
 		["a *** b***", :throw, 'Unclosed emphasis'],
 		# same with underscores
 		["___a__", :throw, 'Unclosed triple *** '],
 		["\\___a__", ['_', md_strong('a')], 'Escaping of *'],
 		["a ___b___ ", ['a ', md_emstrong('b')], 'Strong elements'],
 		["a ___b___", ['a ', md_emstrong('b')]],
 		["a ___ b", ['a ___ b']],
 		["a __ _ b", ['a __ _ b']],
 		["___b______c___", [md_emstrong('b'),md_emstrong('c')]],
 		["a ___ b___", :throw, 'Unclosed emphasis'],
 		# mixing is bad
 		["*a_", :throw, 'Mixing is bad'],
 		["_a*", :throw],
 		["**a__", :throw],
 		["__a**", :throw],
 		["___a***", :throw],
 		["***a___", :throw],
 		# links of the form [text][ref]
 		["\\[a]",  ["[a]"], 'Escaping 1'],
 		["\\[a\\]", ["[a]"], 'Escaping 2'],
 		["[a]",   ["a"],   'Not a link'],
 		["[a][]",   [ md_link(["a"],'')], 'Empty link'],
 		["[a][]b",   [ md_link(["a"],''),'b'], 'Empty link'],
 		["[a\\]][]", [ md_link(["a]"],'')], 'Escape inside link'],
 		["[a",  :throw,   'Link not closed'],
 		["[a][",  :throw,   'Ref not closed'],
 		# links of the form [text](url)
 		["\\[a](b)",  ["[a](b)"], 'Links'],
 		["[a](url)c",  [md_im_link(['a'],'url'),'c'], 'url'],
 		["[a]( url )c" ],
 		["[a] (	url )c" ],
 		["[a] (	url)c" ],
 		["[a](ur:/l/ 'Title')",  [md_im_link(['a'],'ur:/l/','Title')],
 		 	'url and title'],
 		["[a] (	ur:/l/ \"Title\")" ],
 		["[a] (	ur:/l/ \"Title\")" ],
 		["[a]( ur:/l/ Title)", :throw, "Must quote title" ],
 		["[a](url 'Tit\\\"l\\\\e')", [md_im_link(['a'],'url','Tit"l\\e')],
 		 	'url and title escaped'],
 		["[a] (	url \"Tit\\\"l\\\\e\")" ],
 		["[a] (	url	\"Tit\\\"l\\\\e\"  )" ],
 		['[a] (	url	"Tit\\"l\\\\e"  )' ],
 		["[a]()", [md_im_link(['a'],'')], 'No URL is OK'],
 		["[a](\"Title\")", :throw, "No url specified" ],
 		["[a](url \"Title)", :throw, "Unclosed quotes" ],
 		["[a](url \"Title\\\")", :throw],
 		["[a](url \"Title\" ", :throw],
 		["[a](url \'Title\")", :throw, "Mixing is bad" ],
 		["[a](url \"Title\')"],
 		["[a](/url)", [md_im_link(['a'],'/url')], 'Funny chars in url'],
 		["[a](#url)", [md_im_link(['a'],'#url')]],
 		["[a](</script?foo=1&bar=2>)", [md_im_link(['a'],'/script?foo=1&bar=2')]],
 		# Images
 		["\\![a](url)",  ['!', md_im_link(['a'],'url') ], 'Escaping images'],
 		["![a](url)",  [md_im_image(['a'],'url')], 'Image no title'],
 		["![a]( url )" ],
 		["![a] (	url )" ],
 		["![a] (	url)" ],
 		["![a](url 'ti\"tle')",  [md_im_image(['a'],'url','ti"tle')], 'Image with title'],
 		['![a]( url "ti\\"tle")' ],
 		["![a](url", :throw, 'Invalid images'],
 		["![a( url )" ],
 		["![a] ('url )" ],
 		["![a][imref]",  [md_image(['a'],'imref')], 'Image with ref'],
 		["![a][ imref]"],
 		["![a][ imref ]"],
 		["![a][\timref\t]"],
 		['<http://example.com/?foo=1&bar=2>', 
 			[md_url('http://example.com/?foo=1&bar=2')], 'Immediate link'],
 			['a<http://example.com/?foo=1&bar=2>b', 
 				['a',md_url('http://example.com/?foo=1&bar=2'),'b']  ],
 		['<andrea@censi.org>', 
 			[md_email('andrea@censi.org')], 'Email address'],
 		['<mailto:andrea@censi.org>'],
 		["Developmen <http://rubyforge.org/projects/maruku/>",
 			 ["Developmen ", md_url("http://rubyforge.org/projects/maruku/")]],
 		["a<!-- -->b", ['a',md_html('<!-- -->'),'b'], 
 			'HTML Comment'],
 		["a<!--", :throw, 'Bad HTML Comment'],
 		["a<!-- ", :throw, 'Bad HTML Comment'],
 		["<?xml <?!--!`3  ?>", [md_xml_instr('xml','<?!--!`3')], 'XML processing instruction'],
 		["<? <?!--!`3  ?>", [md_xml_instr('','<?!--!`3')] ],
 		["<? ", :throw, 'Bad Server directive'],
 		["a <b", :throw, 'Bad HTML 1'],
 		["<b",   :throw, 'Bad HTML 2'],
 		["<b!",  :throw, 'Bad HTML 3'],
 		['`<div>`, `<table>`, `<pre>`, `<p>`',
 			[md_code('<div>'),', ',md_code('<table>'),', ',
 				md_code('<pre>'),', ',md_code('<p>')],
 				'Multiple HTLM tags'],
 		["&andrea", ["&andrea"], 'Parsing of entities'],
 # no escaping is allowed
 #			["\\&andrea;", ["&andrea;"]],
 		["l&andrea;", ["l", md_entity('andrea')] ],
 		["&&andrea;", ["&", md_entity('andrea')] ],
 		["&123;;&amp;",[md_entity('123'),';',md_entity('amp')]],
 		["a\nThe [syntax page] [s] provides", 
 			['a The ', md_link(['syntax page'],'s'), ' provides'], 'Regression'],
 		['![a](url "ti"tle")', [md_im_image(['a'],'url','ti"tle')], 
 			"Image with quotes"],
 		['![a](url \'ti"tle\')' ],
 		['[bar](/url/ "Title with "quotes" inside")', 
 			[md_im_link(["bar"],'/url/', 'Title with "quotes" inside')],
 			"Link with quotes"],
 		['$20,000 and $30,000', ['$20,000 and $30,000'], 'Math: spaces'],
 		['$20,000$', [md_inline_math('20,000')]],
 		['$ 20,000$', ['$ 20,000$']],
 		['$20,000 $ $20,000$', ['$20,000 $ ', md_inline_math('20,000')]],
 		["#{Maruku8}", [Maruku8], "Reading UTF-8"],
 		["#{AccIta1}", [AccIta8], "Converting ISO-8859-1 to UTF-8", 
 			{:encoding => 'iso-8859-1'}],
 	]
 		good_cases = unit_tests_for_attribute_lists + good_cases
 		count = 1; last_comment=""; last_expected=:throw
 		good_cases.each do |t|
 			if not t[1]
 				t[1] = last_expected
 			else
 				last_expected = t[1]
 			end				
 			if not t[2]
 				t[2] = last_comment + " #{count+=1}"
 			else
 				last_comment = t[2]; count=1
 			end
 		end
 		@verbose = verbose
 		m = Maruku.new
 		m.attributes[:on_error] = :raise
 		Globals[:debug_keep_ials] = true
 		good_cases.each do |input, expected, comment|
 				output = nil
 				begin
 					output = m.parse_span_better(input)
 					#lines = Maruku.split_lines input
 					#output = m.parse_lines_as_span(lines)
 				rescue Exception => e
 					if not expected == :throw
 						ex = e.inspect+ "\n"+ e.backtrace.join("\n")
 						s = comment+describe_difference(input, expected, output)
 						print_status(comment,'CRASHED :-(', ex+s)
 						raise e if @break_on_first_error 
 					else
 						quiet || print_status(comment,'OK')
 					end
 				end
 				if not expected == :throw
 					if not (expected == output)
 						s = comment+describe_difference(input, expected, output)
 						print_status(comment, 'FAILED', s)
 						break if break_on_first_error
 					else
 						quiet || print_status(comment, 'OK')
 					end
 				else # I expected a raise
 					if output
 						s = comment+describe_difference(input, expected, output)
 						print_status(comment, 'FAILED (no throw)', s)
 						break if break_on_first_error
 					end
 				end
 		end
 	end
 	PAD=40
 	def print_status(comment, status, verbose_text=nil)
 		if comment.size < PAD
 			comment = comment + (" "*(PAD-comment.size))
 		end
 		puts "- #{comment} #{status}"
 		if @verbose and verbose_text
 			puts verbose_text
 		end
 	end
 	def describe_difference(input, expected, output)
 		"\nInput:\n  #{input.inspect}" +
 		    "\nExpected:\n  #{expected.inspect}" +
 			"\nOutput:\n  #{output.inspect}\n"
 	end
 end end
 class Maruku
 	include MaRuKu::Tests
 end
 verbose = ARGV.include? 'v'
 break_on_first = ARGV.include? 'b'
 quiet = ARGV.include? 'q'
 Maruku.new.test_span_parser(verbose, break_on_first, quiet)
--- a/lib/maruku/tests/tests.rb
+++ b/lib/maruku/tests/tests.rb
@ -0,0 +1,136 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 require 'maruku'
 class Maruku
 	def Maruku.failed(test, doc, s)
 		raise "Test failed: #{s}\n*****\n#{test}\n*****\n"+
 		"#{doc.inspect}\n*****\n{doc.to_html}"
 	end
 	def Maruku.metaTests
 		ref = {:id => 'id1', :class => ['class1','class2'], 
 			:style=> 'Style is : important = for all } things'}
 		tests = MetaTests.split('***')
 		for test in tests
 			#puts "Test: #{test.inspect}"
 			doc = Maruku.new(test)
 			doc.children.size == 1 ||
 			failed(test, doc, "children != 1") 
 			h = doc.children[0]
 			h.node_type==:header ||
 			failed(test, doc, "child not header") 
 #			puts doc.inspect
 #			puts doc.to_html
 		end
 	end
 MetaTests = <<EOF
 # Head # {ref1 ref2 ref3}
 {ref1}: id: id1; class: class1
 {ref2}: class: class2
 {ref3}: style: "Style is : important = for all } things"  
 ***
 # Head # {ref1 ref3 ref2}
 {ref1}: id: id1; class: class1
 {ref2}: class: class2
 {ref3}: style: "Style is : important = for all } things"  
 ***
 # Head # {ref1 ref2 ref3}
 {ref1}: id= id1; class=class1
 {ref2}: class=class2
 {ref3}: style="Style is : important = for all } things"
 ***
 # Head # {ref1 ref2 ref3}
 {ref1}: id=id1 class=class1
 {ref2}: class=class2
 {ref3}: style="Style is : important = for all } things"
 ***
 # Head # {ref1 ref2 ref3}
 {ref1}: id:id1	class:class1
 {ref2}: class : class2
 {ref3}: style	=	"Style is : important = for all } things"
 ***
 # Head # {ref1 ref2 ref3}
 {ref1}: id:id1	class:class1
  {ref2}: class : class2
   {ref3}: style	=	"Style is : important = for all } things"
 ***
 # Head # {#id1 .class1 ref2 ref3}
 {ref2}: class : class2
 {ref3}: style	=	"Style is : important = for all } things"
 ***
 # Head #  	 {  #id1	.class1	 	ref2	  ref3	}
 {ref2}: class : class2
 {ref3}: style	=	"Style is : important = for all } things"
 ***
 # Head #  	 {  id=id1	class=class1	 	ref2	  ref3	}
 {ref2}: class : class2
 {ref3}: style	=	"Style is : important = for all } things"
 ***
 # Head #  	 {  id:id1	class="class1" class:"class2"  style="Style is : important = for all } things"}
 EOF
 end
 if File.basename($0) == 'tests.rb'
 	Maruku.metaTests
 end
--- a/lib/maruku/toc.rb
+++ b/lib/maruku/toc.rb
@ -0,0 +1,199 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 module MaRuKu
 class MDDocument
 	# an instance of Section (see below)
 	attr_accessor :toc 
 end
 	# This represents a section in the TOC.
 	class Section
 		# a Fixnum, is == header_element.level
 		attr_accessor :section_level 
 		# An array of fixnum, like [1,2,5] for Section 1.2.5
 		attr_accessor :section_number 
 		# reference to header (header has h.meta[:section] to self)
 		attr_accessor :header_element
 		# Array of immediate children of this element
 		attr_accessor :immediate_children
 		# Array of Section inside this section
 		attr_accessor :section_children
 		def initialize
 			@immediate_children = []
 			@section_children = []
 		end
 	end 
 	class Section
 		def inspect(indent=1)
 			s = ""
 			if @header_element
 				s +=  "\_"*indent +  "(#{@section_level})>\t #{@section_number.join('.')} : "
 				s +=  @header_element.children_to_s +
 				 " (id: '#{@header_element.attributes[:id]}')\n"
 			else
 				s += "Master\n"
 			end
 			@section_children.each do |c|
 				s+=c.inspect(indent+1)
 			end
 			s
 		end
 		# Numerate this section and its children
 		def numerate(a=[])
 			self.section_number = a
 			section_children.each_with_index do |c,i|
 				c.numerate(a.clone.push(i+1))
 			end
 			if h = self.header_element
 				h.attributes[:section_number] = self.section_number
 			end
 		end
 		include REXML
 		# Creates an HTML toc.
 		# Call this on the root 
 		def to_html
 			div = Element.new 'div'
 			div.attributes['class'] = 'maruku_toc'
 			div << create_toc
 			div
 		end
 		def create_toc
 			ul = Element.new 'ul'
 			# let's remove the bullets
 			ul.attributes['style'] = 'list-style: none;' 
 			@section_children.each do |c|
 				li = Element.new 'li'
 				if span = c.header_element.render_section_number
 					li << span
 				end
 				a = c.header_element.wrap_as_element('a')
 					a.delete_attribute 'id'
 					a.attributes['href'] = "##{c.header_element.attributes[:id]}"
 				li << a
 				li << c.create_toc if c.section_children.size>0
 				ul << li
 			end
 			ul
 		end
 		# Creates a latex toc.
 		# Call this on the root 
 		def to_latex
 			to_latex_rec + "\n\n"
 		end
 		def to_latex_rec
 			s = ""
 			@section_children.each do |c|
 				s += "\\noindent"
 				number = c.header_element.section_number
 				s += number if number
 					text = c.header_element.children_to_latex
 					id = c.header_element.attributes[:id]
 				s += "\\hyperlink{#{id}}{#{text}}"
 				s += "\\dotfill \\pageref*{#{id}} \\linebreak\n"
 				s += c.to_latex_rec  if c.section_children.size>0
 			end
 			s
 		end
 	end
 	class MDDocument
 		def create_toc
 			each_element(:header) do |h|
 				h.attributes[:id] ||= h.generate_id
 			end
 			stack = []
 			# the ancestor section
 			s = Section.new
 			s.section_level = 0
 			stack.push s
 			i = 0;
 			while i < @children.size
 				while i < @children.size 
 					if @children[i].node_type == :header
 						level = @children[i].level
 						break if level <= stack.last.section_level+1
 					end
 					stack.last.immediate_children.push @children[i]
 					i += 1
 				end
 				break if i>=@children.size
 				header = @children[i]
 				level = header.level
 				if level > stack.last.section_level
 					# this level is inside
 					s2 = Section.new
 					s2.section_level = level
 					s2.header_element = header
 					header.instance_variable_set :@section, s2
 					stack.last.section_children.push s2
 					stack.push s2
 					i+=1
 				elsif level == stack.last.section_level
 					# this level is a sibling
 					stack.pop
 				else 
 					# this level is a parent
 					stack.pop
 				end
 			end
 			# If there is only one big header, then assume
 			# it is the master
 			if s.section_children.size == 1
 				s = s.section_children.first
 			end
 			# Assign section numbers
 			s.numerate
 			s
 		end
 	end
 end
--- a/lib/maruku/usage/example1.rb
+++ b/lib/maruku/usage/example1.rb
@ -0,0 +1,33 @@
 require 'maruku'
 text = <<EOF
 Chapter 1
 =========
 It was a stormy and rainy night.
 EOF
 invalid = <<EOF
 This is a [bad link.
 EOF
 Maruku.new(text).to_html
 s = ""
 begin 
 	Maruku.new(invalid, {:on_error => :raise, :error_stream => s})
 	puts "Error! It should have thrown an exception."
 rescue
 	# puts "ok, got error"
 end
 begin 
 	Maruku.new(invalid, {:on_error => :warning, :error_stream => s})
 rescue
 	puts "Error! It should not have thrown an exception."
 end
--- a/lib/maruku/version.rb
+++ b/lib/maruku/version.rb
@ -0,0 +1,38 @@
 #--
 #   Copyright (C) 2006  Andrea Censi  <andrea (at) rubyforge.org>
 #
 # This file is part of Maruku.
 # 
 #   Maruku is free software; you can redistribute it and/or modify
 #   it under the terms of the GNU General Public License as published by
 #   the Free Software Foundation; either version 2 of the License, or
 #   (at your option) any later version.
 # 
 #   Maruku is distributed in the hope that it will be useful,
 #   but WITHOUT ANY WARRANTY; without even the implied warranty of
 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #   GNU General Public License for more details.
 # 
 #   You should have received a copy of the GNU General Public License
 #   along with Maruku; if not, write to the Free Software
 #   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #++
 module MaRuKu
 	Version = '0.4.2.1'
 	MarukuURL = 'http://maruku.rubyforge.org/'
 	# If true, use also PHP Markdown extra syntax
 	#
 	# Note: it is not guaranteed that if it's false
 	# then no special features will be used.
 	def markdown_extra?
 		true
 	end
 	def new_meta_data?
 		true
 	end
 end
--- a/lib/syntax.rb
+++ b/lib/syntax.rb
@ -0,0 +1,38 @@
 require 'syntax/common'
 module Syntax
  # A default tokenizer for handling syntaxes that are not explicitly handled
  # elsewhere. It simply yields the given text as a single token.
  class Default
    # Yield the given text as a single token.
    def tokenize( text )
      yield Token.new( text, :normal )
    end
  end
  # A hash for registering syntax implementations.
  SYNTAX = Hash.new( Default )
  # Load the implementation of the requested syntax. If the syntax cannot be
  # found, or if it cannot be loaded for whatever reason, the Default syntax
  # handler will be returned.
  def load( syntax )
    begin
      require "syntax/lang/#{syntax}"
    rescue LoadError
    end
    SYNTAX[ syntax ].new
  end
  module_function :load
  # Return an array of the names of supported syntaxes.
  def all
    lang_dir = File.join(File.dirname(__FILE__), "syntax", "lang")
    Dir["#{lang_dir}/*.rb"].map { |path| File.basename(path, ".rb") }
  end
  module_function :all
 end
--- a/lib/syntax/common.rb
+++ b/lib/syntax/common.rb
@ -0,0 +1,163 @@
 require 'strscan'
 module Syntax
  # A single token extracted by a tokenizer. It is simply the lexeme
  # itself, decorated with a 'group' attribute to identify the type of the
  # lexeme.
  class Token < String
    # the type of the lexeme that was extracted.
    attr_reader :group
    # the instruction associated with this token (:none, :region_open, or
    # :region_close)
    attr_reader :instruction
    # Create a new Token representing the given text, and belonging to the
    # given group.
    def initialize( text, group, instruction = :none )
      super text
      @group = group
      @instruction = instruction
    end
  end
  # The base class of all tokenizers. It sets up the scanner and manages the
  # looping until all tokens have been extracted. It also provides convenience
  # methods to make sure adjacent tokens of identical groups are returned as
  # a single token.
  class Tokenizer
    # The current group being processed by the tokenizer
    attr_reader :group
    # The current chunk of text being accumulated
    attr_reader :chunk
    # Start tokenizing. This sets up the state in preparation for tokenization,
    # such as creating a new scanner for the text and saving the callback block.
    # The block will be invoked for each token extracted.
    def start( text, &block )
      @chunk = ""
      @group = :normal
      @callback = block
      @text = StringScanner.new( text )
      setup
    end
    # Subclasses may override this method to provide implementation-specific
    # setup logic.
    def setup
    end
    # Finish tokenizing. This flushes the buffer, yielding any remaining text
    # to the client.
    def finish
      start_group nil
      teardown
    end
    # Subclasses may override this method to provide implementation-specific
    # teardown logic.
    def teardown
    end
    # Subclasses must implement this method, which is called for each iteration
    # of the tokenization process. This method may extract multiple tokens.
    def step
      raise NotImplementedError, "subclasses must implement #step"
    end
    # Begins tokenizing the given text, calling #step until the text has been
    # exhausted.
    def tokenize( text, &block )
      start text, &block
      step until @text.eos?
      finish
    end
    # Specify a set of tokenizer-specific options. Each tokenizer may (or may
    # not) publish any options, but if a tokenizer does those options may be
    # used to specify optional behavior.
    def set( opts={} )
      ( @options ||= Hash.new ).update opts
    end
    # Get the value of the specified option.
    def option(opt)
      @options ? @options[opt] : nil
    end
    private
      EOL = /(?=\r\n?|\n|$)/
      # A convenience for delegating method calls to the scanner.
      def self.delegate( sym )
        define_method( sym ) { |*a| @text.__send__( sym, *a ) }
      end
      delegate :bol?
      delegate :eos?
      delegate :scan
      delegate :scan_until
      delegate :check
      delegate :check_until
      delegate :getch
      delegate :matched
      delegate :pre_match
      delegate :peek
      delegate :pos
      # Access the n-th subgroup from the most recent match.
      def subgroup(n)
        @text[n]
      end
      # Append the given data to the currently active chunk.
      def append( data )
        @chunk << data
      end
      # Request that a new group be started. If the current group is the same
      # as the group being requested, a new group will not be created. If a new
      # group is created and the current chunk is not empty, the chunk's
      # contents will be yielded to the client as a token, and then cleared.
      #
      # After the new group is started, if +data+ is non-nil it will be appended
      # to the chunk.
      def start_group( gr, data=nil )
        flush_chunk if gr != @group
        @group = gr
        @chunk << data if data
      end
      def start_region( gr, data=nil )
        flush_chunk
        @group = gr
        @callback.call( Token.new( data||"", @group, :region_open ) )
      end
      def end_region( gr, data=nil )
        flush_chunk
        @group = gr
        @callback.call( Token.new( data||"", @group, :region_close ) )
      end
      def flush_chunk
        @callback.call( Token.new( @chunk, @group ) ) unless @chunk.empty?
        @chunk = ""
      end
      def subtokenize( syntax, text )
        tokenizer = Syntax.load( syntax )
        tokenizer.set @options if @options
        flush_chunk
        tokenizer.tokenize( text, &@callback )
      end
  end
 end
--- a/lib/syntax/convertors/abstract.rb
+++ b/lib/syntax/convertors/abstract.rb
@ -0,0 +1,27 @@
 require 'syntax'
 module Syntax
  module Convertors
    # The abstract ancestor class for all convertors. It implements a few
    # convenience methods to provide a common interface for all convertors.
    class Abstract
      # A reference to the tokenizer used by this convertor.
      attr_reader :tokenizer
      # A convenience method for instantiating a new convertor for a
      # specific syntax.
      def self.for_syntax( syntax )
        new( Syntax.load( syntax ) )
      end
      # Creates a new convertor that uses the given tokenizer.
      def initialize( tokenizer )
        @tokenizer = tokenizer
      end
    end
  end
 end
--- a/lib/syntax/convertors/html.rb
+++ b/lib/syntax/convertors/html.rb
@ -0,0 +1,51 @@
 require 'syntax/convertors/abstract'
 module Syntax
  module Convertors
    # A simple class for converting a text into HTML.
    class HTML < Abstract
      # Converts the given text to HTML, using spans to represent token groups
      # of any type but <tt>:normal</tt> (which is always unhighlighted). If
      # +pre+ is +true+, the html is automatically wrapped in pre tags.
      def convert( text, pre=true )
        html = ""
        html << "<pre>" if pre
        regions = []
        @tokenizer.tokenize( text ) do |tok|
          value = html_escape(tok)
          case tok.instruction
            when :region_close then
              regions.pop
              html << "</span>"
            when :region_open then
              regions.push tok.group
              html << "<span class=\"#{tok.group}\">#{value}"
            else
              if tok.group == ( regions.last || :normal )
                html << value
              else
                html << "<span class=\"#{tok.group}\">#{value}</span>"
              end
          end
        end
        html << "</span>" while regions.pop
        html << "</pre>" if pre
        html
      end
      private
        # Replaces some characters with their corresponding HTML entities.
        def html_escape( string )
          string.gsub( /&/, "&amp;" ).
                 gsub( /</, "&lt;" ).
                 gsub( />/, "&gt;" ).
                 gsub( /"/, "&quot;" )
        end
    end
  end
 end
--- a/lib/syntax/lang/ruby.rb
+++ b/lib/syntax/lang/ruby.rb
@ -0,0 +1,317 @@
 require 'syntax'
 module Syntax
  # A tokenizer for the Ruby language. It recognizes all common syntax
  # (and some less common syntax) but because it is not a true lexer, it
  # will make mistakes on some ambiguous cases.
  class Ruby < Tokenizer
    # The list of all identifiers recognized as keywords.
    KEYWORDS =
      %w{if then elsif else end begin do rescue ensure while for
         class module def yield raise until unless and or not when
         case super undef break next redo retry in return alias
         defined?}
    # Perform ruby-specific setup
    def setup
      @selector = false
      @allow_operator = false
      @heredocs = []
    end
    # Step through a single iteration of the tokenization process.
    def step
      case
        when bol? && check( /=begin/ )
          start_group( :comment, scan_until( /^=end#{EOL}/ ) )
        when bol? && check( /__END__#{EOL}/ )
          start_group( :comment, scan_until( /\Z/ ) )
      else
        case
          when check( /def\s+/ )
            start_group :keyword, scan( /def\s+/ )
            start_group :method,  scan_until( /(?=[;(\s]|#{EOL})/ )
          when check( /class\s+/ )
            start_group :keyword, scan( /class\s+/ )
            start_group :class,  scan_until( /(?=[;\s<]|#{EOL})/ )
          when check( /module\s+/ )
            start_group :keyword, scan( /module\s+/ )
            start_group :module,  scan_until( /(?=[;\s]|#{EOL})/ )
          when check( /::/ )
            start_group :punct, scan(/::/)
          when check( /:"/ )
            start_group :symbol, scan(/:/)
            scan_delimited_region :symbol, :symbol, "", true
            @allow_operator = true
          when check( /:'/ )
            start_group :symbol, scan(/:/)
            scan_delimited_region :symbol, :symbol, "", false
            @allow_operator = true
          when scan( /:[_a-zA-Z@$][$@\w]*[=!?]?/ )
            start_group :symbol, matched
            @allow_operator = true
          when scan( /\?(\\[^\n\r]|[^\\\n\r\s])/ )
            start_group :char, matched
            @allow_operator = true
          when check( /(__FILE__|__LINE__|true|false|nil|self)[?!]?/ )
            if @selector || matched[-1] == ?? || matched[-1] == ?!
              start_group :ident,
                scan(/(__FILE__|__LINE__|true|false|nil|self)[?!]?/)
            else
              start_group :constant,
                scan(/(__FILE__|__LINE__|true|false|nil|self)/)
            end
            @selector = false
            @allow_operator = true
          when scan(/0([bB][01]+|[oO][0-7]+|[dD][0-9]+|[xX][0-9a-fA-F]+)/)
            start_group :number, matched
            @allow_operator = true
          else
            case peek(2)
              when "%r"
                scan_delimited_region :punct, :regex, scan( /../ ), true
                @allow_operator = true
              when "%w", "%q"
                scan_delimited_region :punct, :string, scan( /../ ), false
                @allow_operator = true
              when "%s"
                scan_delimited_region :punct, :symbol, scan( /../ ), false
                @allow_operator = true
              when "%W", "%Q", "%x"
                scan_delimited_region :punct, :string, scan( /../ ), true
                @allow_operator = true
              when /%[^\sa-zA-Z0-9]/
                scan_delimited_region :punct, :string, scan( /./ ), true
                @allow_operator = true
              when "<<"
                saw_word = ( chunk[-1,1] =~ /[\w!?]/ )
                start_group :punct, scan( /<</ )
                if saw_word
                  @allow_operator = false
                  return
                end
                float_right = scan( /-/ )
                append "-" if float_right
                if ( type = scan( /['"]/ ) )
                  append type
                  delim = scan_until( /(?=#{type})/ )
                  if delim.nil?
                    append scan_until( /\Z/ )
                    return
                  end
                else
                  delim = scan( /\w+/ ) or return
                end
                start_group :constant, delim
                start_group :punct, scan( /#{type}/ ) if type
                @heredocs << [ float_right, type, delim ]
                @allow_operator = true
              else
                case peek(1)
                  when /[\n\r]/
                    unless @heredocs.empty?
                      scan_heredoc(*@heredocs.shift)
                    else
                      start_group :normal, scan( /\s+/ )
                    end
                    @allow_operator = false
                  when /\s/
                    start_group :normal, scan( /\s+/ )
                  when "#"
                    start_group :comment, scan( /#[^\n\r]*/ )
                  when /[A-Z]/
                    start_group @selector ? :ident : :constant, scan( /\w+/ )
                    @allow_operator = true
                  when /[a-z_]/
                    word = scan( /\w+[?!]?/ )
                    if !@selector && KEYWORDS.include?( word )
                      start_group :keyword, word
                      @allow_operator = false
                    elsif
                      start_group :ident, word
                      @allow_operator = true
                    end
                    @selector = false
                  when /\d/
                    start_group :number,
                      scan( /[\d_]+(\.[\d_]+)?([eE][\d_]+)?/ )
                    @allow_operator = true
                  when '"'
                    scan_delimited_region :punct, :string, "", true
                    @allow_operator = true
                  when '/'
                    if @allow_operator
                      start_group :punct, scan(%r{/})
                      @allow_operator = false
                    else
                      scan_delimited_region :punct, :regex, "", true
                      @allow_operator = true
                    end
                  when "'"
                    scan_delimited_region :punct, :string, "", false
                    @allow_operator = true
                  when "."
                    dots = scan( /\.{1,3}/ )
                    start_group :punct, dots
                    @selector = ( dots.length == 1 )
                  when /[@]/
                    start_group :attribute, scan( /@{1,2}\w*/ )
                    @allow_operator = true
                  when /[$]/
                    start_group :global, scan(/\$/)
                    start_group :global, scan( /\w+|./ ) if check(/./)
                    @allow_operator = true
                  when /[-!?*\/+=<>(\[\{}:;,&|%]/
                    start_group :punct, scan(/./)
                    @allow_operator = false
                  when /[)\]]/
                    start_group :punct, scan(/./)
                    @allow_operator = true
                  else
                    # all else just falls through this, to prevent
                    # infinite loops...
                    append getch
                end
            end
        end
      end
    end
    private
      # Scan a delimited region of text. This handles the simple cases (strings
      # delimited with quotes) as well as the more complex cases of %-strings
      # and here-documents.
      #
      # * +delim_group+ is the group to use to classify the delimiters of the
      #   region
      # * +inner_group+ is the group to use to classify the contents of the
      #   region
      # * +starter+ is the text to use as the starting delimiter
      # * +exprs+ is a boolean flag indicating whether the region is an
      #   interpolated string or not
      # * +delim+ is the text to use as the delimiter of the region. If +nil+,
      #   the next character will be treated as the delimiter.
      # * +heredoc+ is either +false+, meaning the region is not a heredoc, or
      #   <tt>:flush</tt> (meaning the delimiter must be flushed left), or
      #   <tt>:float</tt> (meaning the delimiter doens't have to be flush left).
      def scan_delimited_region( delim_group, inner_group, starter, exprs,
        delim=nil, heredoc=false )
      # begin
        if !delim
          start_group delim_group, starter
          delim = scan( /./ )
          append delim
          delim = case delim
            when '{' then '}'
            when '(' then ')'
            when '[' then ']'
            when '<' then '>'
            else delim
          end
        end
        start_region inner_group
        items = "\\\\|"
        if heredoc
          items << "(^"
          items << '\s*' if heredoc == :float
          items << "#{Regexp.escape(delim)}\s*?)#{EOL}"
        else
          items << "#{Regexp.escape(delim)}"
        end
        items << "|#(\\$|@@?|\\{)" if exprs
        items = Regexp.new( items )
        loop do
          p = pos
          match = scan_until( items )
          if match.nil?
            start_group inner_group, scan_until( /\Z/ )
            break
          else
            text = pre_match[p..-1]
            start_group inner_group, text if text.length > 0
            case matched.strip
              when "\\"
                unless exprs
                  case peek(1)
                    when "'"
                      scan(/./)
                      start_group :escape, "\\'"
                    when "\\"
                      scan(/./)
                      start_group :escape, "\\\\"
                    else
                      start_group inner_group, "\\"
                  end
                else
                  start_group :escape, "\\"
                  c = getch
                  append c
                  case c
                    when 'x'
                      append scan( /[a-fA-F0-9]{1,2}/ )
                    when /[0-7]/
                      append scan( /[0-7]{0,2}/ )
                  end
                end
              when delim
                end_region inner_group
                start_group delim_group, matched
                break
              when /^#/
                do_highlight = (option(:expressions) == :highlight)
                start_region :expr if do_highlight
                start_group :expr, matched
                case matched[1]
                  when ?{
                    depth = 1
                    content = ""
                    while depth > 0
                      p = pos
                      c = scan_until( /[\{}]/ )
                      if c.nil?
                        content << scan_until( /\Z/ )
                        break
                      else
                        depth += ( matched == "{" ? 1 : -1 )
                        content << pre_match[p..-1]
                        content << matched if depth > 0
                      end
                    end
                    if do_highlight
                      subtokenize "ruby", content
                      start_group :expr, "}"
                    else
                      append content + "}"
                    end
                  when ?$, ?@
                    append scan( /\w+/ )
                end
                end_region :expr if do_highlight
              else raise "unexpected match on #{matched}"
            end
          end
        end
      end
      # Scan a heredoc beginning at the current position.
      #
      # * +float+ indicates whether the delimiter may be floated to the right
      # * +type+ is +nil+, a single quote, or a double quote
      # * +delim+ is the delimiter to look for
      def scan_heredoc(float, type, delim)
        scan_delimited_region( :constant, :string, "", type != "'",
          delim, float ? :float : :flush )
      end
  end
  SYNTAX["ruby"] = Ruby
 end
--- a/lib/syntax/lang/xml.rb
+++ b/lib/syntax/lang/xml.rb
@ -0,0 +1,108 @@
 require 'syntax'
 module Syntax
  # A simple implementation of an XML lexer. It handles most cases. It is
  # not a validating lexer, meaning it will happily process invalid XML without
  # complaining.
  class XML < Tokenizer
    # Initialize the lexer.
    def setup
      @in_tag = false
    end
    # Step through a single iteration of the tokenization process. This will
    # yield (potentially) many tokens, and possibly zero tokens.
    def step
      start_group :normal, matched if scan( /\s+/ )
      if @in_tag
        case
          when scan( /([-\w]+):([-\w]+)/ )
            start_group :namespace, subgroup(1)
            start_group :punct, ":"
            start_group :attribute, subgroup(2)
          when scan( /\d+/ )
            start_group :number, matched
          when scan( /[-\w]+/ )
            start_group :attribute, matched
          when scan( %r{[/?]?>} )
            @in_tag = false
            start_group :punct, matched
          when scan( /=/ )
            start_group :punct, matched
          when scan( /["']/ )
            scan_string matched
          else
            append getch
        end
      elsif ( text = scan_until( /(?=[<&])/ ) )
        start_group :normal, text unless text.empty?
        if scan(/<!--.*?(-->|\Z)/m)
          start_group :comment, matched
        else
          case peek(1)
            when "<"
              start_group :punct, getch
              case peek(1)
                when "?"
                  append getch
                when "/"
                  append getch
                when "!"
                  append getch
              end
              start_group :normal, matched if scan( /\s+/ )
              if scan( /([-\w]+):([-\w]+)/ )
                start_group :namespace, subgroup(1)
                start_group :punct, ":"
                start_group :tag, subgroup(2)
              elsif scan( /[-\w]+/ )
                start_group :tag, matched
              end
              @in_tag = true
            when "&"
              if scan( /&\S{1,10};/ )
                start_group :entity, matched
              else
                start_group :normal, scan( /&/ )
              end
          end
        end
      else
        append scan_until( /\Z/ )
      end
    end
    private
      # Scan the string starting at the current position, with the given
      # delimiter character.
      def scan_string( delim )
        start_group :punct, delim
        match = /(?=[&\\]|#{delim})/
        loop do
          break unless ( text = scan_until( match ) )
          start_group :string, text unless text.empty?
          case peek(1)
            when "&"
              if scan( /&\S{1,10};/ )
                start_group :entity, matched
              else
                start_group :string, getch
              end
            when "\\"
              start_group :string, getch
              append getch || ""
            when delim
              start_group :punct, getch
              break
          end
        end
      end
  end
  SYNTAX["xml"] = XML
 end
--- a/lib/syntax/lang/yaml.rb
+++ b/lib/syntax/lang/yaml.rb
@ -0,0 +1,105 @@
 require 'syntax'
 module Syntax
  # A simple implementation of an YAML lexer. It handles most cases. It is
  # not a validating lexer.
  class YAML < Tokenizer
    # Step through a single iteration of the tokenization process. This will
    # yield (potentially) many tokens, and possibly zero tokens.
    def step
      if bol?
        case
          when scan(/---(\s*.+)?$/)
            start_group :document, matched
          when scan(/(\s*)([a-zA-Z][-\w]*)(\s*):/)
            start_group :normal, subgroup(1)
            start_group :key, subgroup(2)
            start_group :normal, subgroup(3)
            start_group :punct, ":"
          when scan(/(\s*)-/)
            start_group :normal, subgroup(1)
            start_group :punct, "-"
          when scan(/\s*$/)
            start_group :normal, matched
          when scan(/#.*$/)
            start_group :comment, matched
          else
            append getch
        end
      else
        case
          when scan(/[\n\r]+/)
            start_group :normal, matched
          when scan(/[ \t]+/)
            start_group :normal, matched
          when scan(/!+(.*?^)?\S+/)
            start_group :type, matched
          when scan(/&\S+/)
            start_group :anchor, matched
          when scan(/\*\S+/)
            start_group :ref, matched
          when scan(/\d\d:\d\d:\d\d/)
            start_group :time, matched
          when scan(/\d\d\d\d-\d\d-\d\d\s\d\d:\d\d:\d\d(\.\d+)? [-+]\d\d:\d\d/)
            start_group :date, matched
          when scan(/['"]/)
            start_group :punct, matched
            scan_string matched
          when scan(/:\w+/)
            start_group :symbol, matched
          when scan(/[:]/)
            start_group :punct, matched
          when scan(/#.*$/)
            start_group :comment, matched
          when scan(/>-?/)
            start_group :punct, matched
            start_group :normal, scan(/.*$/)
            append getch until eos? || bol?
            return if eos?
            indent = check(/ */)
            start_group :string
            loop do
              line = check_until(/[\n\r]|\Z/)
              break if line.nil?
              if line.chomp.length > 0
                this_indent = line.chomp.match( /^\s*/ )[0]
                break if this_indent.length < indent.length
              end
              append scan_until(/[\n\r]|\Z/)
            end
          else
            start_group :normal, scan_until(/(?=$|#)/)
        end
      end
    end
    private
      def scan_string( delim )
        regex = /(?=[#{delim=="'" ? "" : "\\\\"}#{delim}])/
        loop do
          text = scan_until( regex )
          if text.nil?
            start_group :string, scan_until( /\Z/ )
            break
          else
            start_group :string, text unless text.empty?
          end
          case peek(1)
            when "\\"
              start_group :expr, scan(/../)
            else
              start_group :punct, getch
              break
          end
        end
      end
  end
  SYNTAX["yaml"] = YAML
 end
--- a/lib/syntax/version.rb
+++ b/lib/syntax/version.rb
@ -0,0 +1,9 @@
 module Syntax
  module Version
    MAJOR=1
    MINOR=0
    TINY=0
    STRING=[MAJOR,MINOR,TINY].join('.')
  end
 end
--- a/log/production.log
+++ b/log/production.log
@ -0,0 +1,3 @@
 # Logfile created on Mon Jan 22 07:45:04 CST 2007 by logger.rb/1.5.2.7
 Migrating to Beta1Schema (1)
 Migrating to Beta2ChangesBulk (2)
--- a/public/stylesheets/instiki.css
+++ b/public/stylesheets/instiki.css
@ -318,3 +318,8 @@ border:none;
 margin:0;
 padding:0;
 }
 merror {display:inline;font-size:1em;}
 math[display=block] {overflow:auto;}
 math { white-space: nowrap }
 .maruku-eq-number {float:right}