diff --git a/Commands/Generate.plist b/Commands/Generate.plist new file mode 100644 index 0000000..ffe0927 --- /dev/null +++ b/Commands/Generate.plist @@ -0,0 +1,132 @@ + + + + + beforeRunningCommand + saveActiveFile + command + #!/usr/bin/env ruby -s + +require 'erb' + +def markdown_text (text) + text.gsub(/`(.*?)`/, '<code>\1</code>') +end + +def make_id (text) + text = text.gsub(/`(.*?)`/, '\1') + text.gsub!(/[- \/_]+/, '_') + text.gsub!(/[^a-zA-Z0-9_]+/, '') + text.downcase +end + +Dir.chdir(ENV['TM_PROJECT_DIRECTORY']) + +$toc = [ "<h1>Table of Contents</h1>" ] +$chapters = [ ] + +$toc_template = "templates/toc.rhtml" if $toc_template.nil? +$chapter_template = "templates/chapter.rhtml" if $chapter_template.nil? +$all_template = "templates/all.rhtml" if $all_template.nil? +$output_dir = "html" if $output_dir.nil? + +files = Dir.entries("pages").sort.grep(/.*\.markdown/) +files.each_with_index do |file, i| + + def html_link (markdown_file) + markdown_file.sub(/^(?:\d+ )?(.*?)\.markdown$/, '\1.html') + end + + puts "• Convert #{file}…" + + $page_toc = [ ] + + IO.popen('"' + ENV['TM_BUNDLE_SUPPORT'] + '/bin/MultiMarkdown.pl"| "' + ENV['TM_SUPPORT_PATH'] + '/bin/SmartyPants.pl"| "' + ENV['TM_BUNDLE_SUPPORT'] + '"/add_image_size.rb', "r+") do |f| + + Thread.fork do + heading_stack = [ i ] + lastlevel = 0; + File.open("pages/#{file}").each_line do |line| + + if(m = line.match(/^(#+)\s+(.*)$/)) + level = m[1].length + title = m[2] + + if heading_stack.length < level + heading_stack.push(0) +# $toc.push("<ol>") + else + while heading_stack.length > level + heading_stack.pop +# $toc.push("</ol>") + end + end + + heading_stack.push(heading_stack.pop + 1) + prefix = heading_stack.join(".") + puts(" #{prefix} #{title}") + + toc_entry = "#{"<ul><li>" if(level > lastlevel)}#{"</li><li>" if(level == lastlevel)}#{"</li></ul>" * (lastlevel - level) if(level < lastlevel)}<span class='toc_number'>#{prefix}</span><a href='#{html_link file}##{make_id title}'>#{markdown_text 
title}</a>"; + + $toc.push(toc_entry) + $page_toc.push(toc_entry) + + f.write("#{m[1]} <span id='#{make_id title}'>#{prefix}</span> #{title}") + lastlevel = level; + else + f.write(line) + end + + end + + lastlevel.times {$page_toc.push("</li></ul>")} + begin + f.write("\n"+File.open("markdown.references").read) + rescue + + end + f.close_write + + lastlevel.times {$toc.push("</li></ul>")} +# heading_stack.length.times { $toc.push("</ol>") } + end + + $page = { :title => %x{ grep '^#' 'pages/#{file}'|head -n1 }.sub(/^#+\s+(.*)\n/, '\1'), :content => f.read, :name => "chapter", :page_toc => $page_toc.join("\n") } + $prev = i > 0 ? { :link => "#{html_link files[i-1]}", :title => markdown_text(%x{ grep '^#' 'pages/#{files[i-1]}'|head -n1 }.sub(/^#+\s+(.*)\n/, '\1')) } : nil + $next = i + 1 < files.length ? { :link => "#{html_link files[i+1]}", :title => markdown_text(%x{ grep '^#' 'pages/#{files[i+1]}'|head -n1 }.sub(/^#+\s+(.*)\n/, '\1')) } : nil + + File.open("#{$output_dir}/#{html_link file}", "w") do |f| + f.write(ERB.new(File.open($chapter_template), 0, '<>').result) + end + + $chapters.push($page) + + end + +end + +$alltoc = { :toc => $toc.join("\n") } +File.open("#{$output_dir}/all_pages.html", "w") do |f| + f.write(ERB.new(File.open($all_template), 0, '<>').result) +end + + +File.open("#{$output_dir}/index.html", "w") do |f| + $page = { :content => $toc.join("\n"), :name => "toc", :title => "Table of Contents" } + f.write(ERB.new(File.open($toc_template), 0, '<>').result) +end + + input + none + keyEquivalent + ^G + name + Generate + output + showAsTooltip + scope + text.html.markdown + uuid + C445442D-06BF-4CEE-A642-6209B84632A6 + + diff --git a/Commands/Open Generated Stuff.plist b/Commands/Open Generated Stuff.plist new file mode 100644 index 0000000..5f13402 --- /dev/null +++ b/Commands/Open Generated Stuff.plist @@ -0,0 +1,22 @@ + + + + + beforeRunningCommand + nop + command + open "$TM_PROJECT_DIRECTORY/html/index.html" + input + none + keyEquivalent + 
^O + name + Open Generated Files + output + discard + scope + text.html.markdown + uuid + B3AF90C8-A1B0-4583-A5E4-74374B68B015 + + diff --git a/Commands/Readme.plist b/Commands/Readme.plist new file mode 100644 index 0000000..7e44dc5 --- /dev/null +++ b/Commands/Readme.plist @@ -0,0 +1,21 @@ + + + + + beforeRunningCommand + nop + command + . "$TM_SUPPORT_PATH/lib/webpreview.sh" +html_header "Markdown2Book Help file" "Markdown2Book" +Markdown.pl "$TM_BUNDLE_SUPPORT/help.markdown"|SmartyPants.pl +html_footer + input + none + name + Readme + output + showAsHTML + uuid + B9B57AA0-0024-41F6-B6AE-C60FCDC1E8B1 + + diff --git a/Commands/Show References.plist b/Commands/Show References.plist new file mode 100644 index 0000000..ef31d40 --- /dev/null +++ b/Commands/Show References.plist @@ -0,0 +1,34 @@ + + + + + beforeRunningCommand + nop + command + res=$(CocoaDialog dropdown --text "References" --items `cat "$TM_PROJECT_DIRECTORY/markdown.references"|sed 's/ /_/'` --button1 "Insert") + +[[ $(head -n1 <<<"$res") == "2" ]] && exit_discard + +res=$(tail -n1 <<<"$res") + +let "res += 2" + +res=$(head -n "$res" "$TM_PROJECT_DIRECTORY/markdown.references" |tail -n 1) + +res=$(sed 's/\[\(.*\)\].*/[${1:Reference text}][\1]/'<<<"$res") + +echo -n "$res" + input + none + keyEquivalent + ^l + name + Show References + output + insertAsSnippet + scope + text.html.markdown + uuid + 3E0EDBF3-2018-46EA-95EE-C4EB20118789 + + diff --git a/Commands/Update References.plist b/Commands/Update References.plist new file mode 100644 index 0000000..03d53da --- /dev/null +++ b/Commands/Update References.plist @@ -0,0 +1,43 @@ + + + + + beforeRunningCommand + nop + command + #!/bin/bash + +cd "$TM_PROJECT_DIRECTORY" + +if [ ! 
-f "markdown.references" ]; then touch "markdown.references"; fi + +all_refs=$(grep -ho '\[[^]]*\]\[[^]]*\]' pages/*.markdown|perl -pe 's/.*\[(.*)\]$/$1/'|sort|uniq) + +known_refs=$(grep '^\[.*\]' markdown.references|perl -pe 's/^\[(.*?)\].*/$1/') + +all_ptrn=$(tr <<<"$all_refs" '\n' '|') +known_ptrn=$(tr <<<"$known_refs" '\n' '|') + +all_ptrn="${all_ptrn:0:${#all_ptrn}-1}" +known_ptrn="${known_ptrn:0:${#known_ptrn}-1}" + +echo -e "Missing:\n" +grep -Ev <<<"$all_refs" "^($known_ptrn)$"|perl -pe 's/.*/[$&]: MISSING/'|tee -a markdown.references + +echo -e "\nRedundant:\n" +grep -Ev <<<"$known_refs" "^($all_ptrn)$" + + input + none + keyEquivalent + ^U + name + Update References + output + showAsTooltip + scope + text + uuid + 749EA16A-700B-43B3-9457-FA12D8301CAE + + diff --git a/README b/README new file mode 100644 index 0000000..4fc0de2 --- /dev/null +++ b/README @@ -0,0 +1 @@ +This TextMate bundle is for compiling a Documentation project made of several Markdown files to HTML. It generates a TOC, a print version with all chapters on one page and HTML files for each chapter. You can use references to easily link between your pages. 
\ No newline at end of file diff --git a/Support/add_image_size.rb b/Support/add_image_size.rb new file mode 100755 index 0000000..cd6edad --- /dev/null +++ b/Support/add_image_size.rb @@ -0,0 +1,12 @@ +#!/usr/bin/env ruby + +STDIN.each_line do |line| + line.gsub!(/]*?(?:width|height)=)[^>*]src="(.*?)"/) do |tag| + size = %x(sips -g pixelWidth -g pixelHeight "#{$1}") + size.gsub(/pixel(Width|Height): (\d+)/) { |str| tag += " #{$1.downcase}=\"#{$2}\"" } + # use the next line to change the image path + # tag.gsub(/src="([^"]+)"/, 'src="http://yoursite.com/path/to/images/\1"') + tag.gsub(/src="([^"]+)"/, 'src="\1"') + end + print line +end diff --git a/Support/bin/MultiMarkdown.pl b/Support/bin/MultiMarkdown.pl new file mode 100755 index 0000000..620f5b9 --- /dev/null +++ b/Support/bin/MultiMarkdown.pl @@ -0,0 +1,2216 @@ +#!/usr/bin/env perl + +# MultiMarkdown -- A modification of John Gruber's original Markdown +# that adds new features and an output format that can more readily +# be converted into other document formats +# +# Original Code Copyright (c) 2004 John Gruber +# +# +# MultiMarkdown changes Copyright (c) 2005-2006 Fletcher T. Penney +# +# + + +package Markdown; +require 5.006_000; +use strict; +use warnings; + +use Digest::MD5 qw(md5_hex); +use vars qw($VERSION $g_use_metadata $g_use_wiki_links $g_base_url); +$VERSION = '1.0.1Multi19.1'; + +## Disabled; causes problems under Perl 5.6.1: +# use utf8; +# binmode( STDOUT, ":utf8" ); # c.f.: http://acis.openlib.org/dev/perl-unicode-struggle.html + + +# +# Global default settings: +# +my $g_empty_element_suffix = " />"; # Change to ">" for HTML output +my $g_tab_width = 4; + + +# +# Globals: +# + +# Regex to match balanced [brackets]. See Friedl's +# "Mastering Regular Expressions", 2nd Ed., pp. 328-331. 
+my $g_nested_brackets; +$g_nested_brackets = qr{ + (?> # Atomic matching + [^\[\]]+ # Anything other than brackets + | + \[ + (??{ $g_nested_brackets }) # Recursive set of nested brackets + \] + )* +}x; + + +# Table of hash values for escaped characters: +my %g_escape_table; +foreach my $char (split //, '\\`*_{}[]()>#+-.!') { + $g_escape_table{$char} = md5_hex($char); +} + + +# Global hashes, used by various utility routines +my %g_urls; +my %g_titles; +my %g_html_blocks; +my %g_metadata = (); +my %g_metadata_newline; +my %g_crossrefs; +my %g_footnotes; +my %g_attributes; +my @g_used_footnotes; +my $g_footnote_counter = 0; +my %g_citations; + +my $g_citation_counter = 0; +my @g_used_references; +my %g_references; + +$g_use_metadata = 1; +$g_metadata_newline{default} = "\n"; +my $g_document_format = ""; + +# For use with WikiWords and [[Wiki Links]] +$g_use_wiki_links = 0; +$g_base_url = ""; # This is the base url to be used for WikiLinks +my $g_temp_no_wikiwords = 0; + +# NOTE: +# You can use \WikiWord to prevent a WikiWord from being treated as a link + + +# Used to track when we're inside an ordered or unordered list +# (see _ProcessListItems() for details): +my $g_list_level = 0; + + +#### Blosxom plug-in interface ########################################## + +# Set $g_blosxom_use_meta to 1 to use Blosxom's meta plug-in to determine +# which posts Markdown should process, using a "meta-markup: markdown" +# header. If it's set to 0 (the default), Markdown will process all +# entries. +my $g_blosxom_use_meta = 0; + +sub start { 1; } +sub story { + my($pkg, $path, $filename, $story_ref, $title_ref, $body_ref) = @_; + + if ( (! $g_blosxom_use_meta) or + (defined($meta::markup) and ($meta::markup =~ /^\s*markdown\s*$/i)) + ){ + $$body_ref = Markdown($$body_ref); + } + 1; +} + + +#### Movable Type plug-in interface ##################################### +eval {require MT}; # Test to see if we're running in MT. 
+unless ($@) { + require MT; + import MT; + require MT::Template::Context; + import MT::Template::Context; + + eval {require MT::Plugin}; # Test to see if we're running >= MT 3.0. + unless ($@) { + require MT::Plugin; + import MT::Plugin; + my $plugin = new MT::Plugin({ + name => "Markdown", + description => "A plain-text-to-HTML formatting plugin. (Version: $VERSION)", + doc_link => 'http://daringfireball.net/projects/markdown/' + }); + MT->add_plugin( $plugin ); + } + + MT::Template::Context->add_container_tag(MarkdownOptions => sub { + my $ctx = shift; + my $args = shift; + my $builder = $ctx->stash('builder'); + my $tokens = $ctx->stash('tokens'); + + if (defined ($args->{'output'}) ) { + $ctx->stash('markdown_output', lc $args->{'output'}); + } + + defined (my $str = $builder->build($ctx, $tokens) ) + or return $ctx->error($builder->errstr); + $str; # return value + }); + + MT->add_text_filter('markdown' => { + label => 'Markdown', + docs => 'http://daringfireball.net/projects/markdown/', + on_format => sub { + my $text = shift; + my $ctx = shift; + my $raw = 0; + if (defined $ctx) { + my $output = $ctx->stash('markdown_output'); + if (defined $output && $output =~ m/^html/i) { + $g_empty_element_suffix = ">"; + $ctx->stash('markdown_output', ''); + } + elsif (defined $output && $output eq 'raw') { + $raw = 1; + $ctx->stash('markdown_output', ''); + } + else { + $raw = 0; + $g_empty_element_suffix = " />"; + } + } + $text = $raw ? 
$text : Markdown($text); + $text; + }, + }); + + # If SmartyPants is loaded, add a combo Markdown/SmartyPants text filter: + my $smartypants; + + { + no warnings "once"; + $smartypants = $MT::Template::Context::Global_filters{'smarty_pants'}; + } + + if ($smartypants) { + MT->add_text_filter('markdown_with_smartypants' => { + label => 'Markdown With SmartyPants', + docs => 'http://daringfireball.net/projects/markdown/', + on_format => sub { + my $text = shift; + my $ctx = shift; + if (defined $ctx) { + my $output = $ctx->stash('markdown_output'); + if (defined $output && $output eq 'html') { + $g_empty_element_suffix = ">"; + } + else { + $g_empty_element_suffix = " />"; + } + } + $text = Markdown($text); + $text = $smartypants->($text, '1'); + }, + }); + } +} +else { +#### BBEdit/command-line text filter interface ########################## +# Needs to be hidden from MT (and Blosxom when running in static mode). + + # We're only using $blosxom::version once; tell Perl not to warn us: + no warnings 'once'; + unless ( defined($blosxom::version) ) { + use warnings; + + #### Check for command-line switches: ################# + my %cli_opts; + use Getopt::Long; + Getopt::Long::Configure('pass_through'); + GetOptions(\%cli_opts, + 'version', + 'shortversion', + 'html4tags', + ); + if ($cli_opts{'version'}) { # Version info + print "\nThis is Markdown, version $VERSION.\n"; + print "Copyright 2004 John Gruber\n"; + print "http://daringfireball.net/projects/markdown/\n\n"; + exit 0; + } + if ($cli_opts{'shortversion'}) { # Just the version number string. + print $VERSION; + exit 0; + } + if ($cli_opts{'html4tags'}) { # Use HTML tag style instead of XHTML + $g_empty_element_suffix = ">"; + } + + + #### Process incoming text: ########################### + my $text; + { + local $/; # Slurp the whole file + $text = <>; + } + print Markdown($text); + } +} + + + +sub Markdown { +# +# Main function. The order in which other subs are called here is +# essential. 
Link and image substitutions need to happen before +# _EscapeSpecialChars(), so that any *'s or _'s in the +# and tags get encoded. +# + my $text = shift; + + # Clear the global hashes. If we don't clear these, you get conflicts + # from other articles when generating a page which contains more than + # one article (e.g. an index page that shows the N most recent + # articles): + %g_urls = (); + %g_titles = (); + %g_html_blocks = (); + %g_metadata = (); + %g_crossrefs = (); + %g_footnotes = (); + @g_used_footnotes = (); + + + + # Standardize line endings: + $text =~ s{\r\n}{\n}g; # DOS to Unix + $text =~ s{\r}{\n}g; # Mac to Unix + + # Make sure $text ends with a couple of newlines: + $text .= "\n\n"; + + # Convert all tabs to spaces. + $text = _Detab($text); + + # Strip any lines consisting only of spaces and tabs. + # This makes subsequent regexen easier to write, because we can + # match consecutive blank lines with /\n+/ instead of something + # contorted like /[ \t]*\n+/ . + $text =~ s/^[ \t]+$//mg; + + # Strip leading blank lines + $text =~ s/^\n+//s; + + # Strip out MetaData + $text = _ParseMetaData($text) if $g_use_metadata; + + # And recheck for leading blank lines + $text =~ s/^\n+//s; + + # Turn block-level HTML blocks into hash entries + $text = _HashHTMLBlocks($text); + + # Strip link definitions, store in hashes. + $text = _StripLinkDefinitions($text); + + $text = _StripFootnoteDefinitions($text); + + $text = _StripMarkdownReferences($text); + + $text = _RunBlockGamut($text); + + $text = _DoMarkdownCitations($text); + + $text = _DoFootnotes($text); + + $text = _UnescapeSpecialChars($text); + + # This must follow _UnescapeSpecialChars + $text = _UnescapeWikiWords($text); + + $text = _FixFootnoteParagraphs($text); + $text .= _PrintFootnotes(); + + $text .= _PrintMarkdownBibliography(); + + $text = _ConvertCopyright($text); + + if (lc($g_document_format) =~ /^complete\s*$/) { + return xhtmlMetaData() . "\n" . $text . 
"\n\n"; + } else { + return textMetaData() . $text . "\n"; + } + +} + + +sub _StripLinkDefinitions { +# +# Strips link definitions from text, stores the URLs and titles in +# hash references. +# + my $text = shift; + my $less_than_tab = $g_tab_width - 1; + + # Link defs are in the form: ^[id]: url "optional title" + while ($text =~ s{ + ^[ ]{0,$less_than_tab}\[(.+)\]: # id = $1 + [ \t]* + \n? # maybe *one* newline + [ \t]* + ? # url = $2 + [ \t]* + \n? # maybe one newline + [ \t]* + (?: + (?<=\s) # lookbehind for whitespace + ["(] + (.+?) # title = $3 + [")] + [ \t]* + )? # title is optional + + # MultiMarkdown addition for attribute support + \n? + ( # Attributes = $4 + (?<=\s) # lookbehind for whitespace + (([ \t]*\n)?[ \t]*((\S+=\S+)|(\S+=".*?")))* + )? + [ \t]* + # /addition + (?:\n+|\Z) + } + {}mx) { + $g_urls{lc $1} = _EncodeAmpsAndAngles( $2 ); # Link IDs are case-insensitive + if ($3) { + $g_titles{lc $1} = $3; + $g_titles{lc $1} =~ s/"/"/g; + } + + # MultiMarkdown addition " + if ($4) { + $g_attributes{lc $1} = $4; + } + # /addition + } + + return $text; +} + + +sub _HashHTMLBlocks { + my $text = shift; + my $less_than_tab = $g_tab_width - 1; + + # Hashify HTML blocks: + # We only want to do this for block-level HTML tags, such as headers, + # lists, and tables. That's because we still want to wrap

s around + # "paragraphs" that are wrapped in non-block-level tags, such as anchors, + # phrase emphasis, and spans. The list of tags we're looking for is + # hard-coded: + my $block_tags_a = qr/p|div|h[1-6]|blockquote|pre|table|dl|ol|ul|script|noscript|form|fieldset|iframe|math|ins|del/; + my $block_tags_b = qr/p|div|h[1-6]|blockquote|pre|table|dl|ol|ul|script|noscript|form|fieldset|iframe|math/; + + # First, look for nested blocks, e.g.: + #

+ #
+ # tags for inner block must be indented. + #
+ #
+ # + # The outermost tags must start at the left margin for this to match, and + # the inner nested divs must be indented. + # We need to do this before the next, more liberal match, because the next + # match will start at the first `
` and stop at the first `
`. + $text =~ s{ + ( # save in $1 + ^ # start of line (with /m) + <($block_tags_a) # start tag = $2 + \b # word break + (.*\n)*? # any number of lines, minimally matching + # the matching end tag + [ \t]* # trailing spaces/tabs + (?=\n+|\Z) # followed by a newline or end of document + ) + }{ + my $key = md5_hex($1); + $g_html_blocks{$key} = $1; + "\n\n" . $key . "\n\n"; + }egmx; + + + # + # Now match more liberally, simply from `\n` to `\n` + # + $text =~ s{ + ( # save in $1 + ^ # start of line (with /m) + <($block_tags_b) # start tag = $2 + \b # word break + (.*\n)*? # any number of lines, minimally matching + .* # the matching end tag + [ \t]* # trailing spaces/tabs + (?=\n+|\Z) # followed by a newline or end of document + ) + }{ + my $key = md5_hex($1); + $g_html_blocks{$key} = $1; + "\n\n" . $key . "\n\n"; + }egmx; + # Special case just for
. It was easier to make a special case than + # to make the other regex more complicated. + $text =~ s{ + (?: + (?<=\n\n) # Starting after a blank line + | # or + \A\n? # the beginning of the doc + ) + ( # save in $1 + [ ]{0,$less_than_tab} + <(hr) # start tag = $2 + \b # word break + ([^<>])*? # + /?> # the matching end tag + [ \t]* + (?=\n{2,}|\Z) # followed by a blank line or end of document + ) + }{ + my $key = md5_hex($1); + $g_html_blocks{$key} = $1; + "\n\n" . $key . "\n\n"; + }egx; + + # Special case for standalone HTML comments: + $text =~ s{ + (?: + (?<=\n\n) # Starting after a blank line + | # or + \A\n? # the beginning of the doc + ) + ( # save in $1 + [ ]{0,$less_than_tab} + (?s: + + ) + [ \t]* + (?=\n{2,}|\Z) # followed by a blank line or end of document + ) + }{ + my $key = md5_hex($1); + $g_html_blocks{$key} = $1; + "\n\n" . $key . "\n\n"; + }egx; + + + return $text; +} + + +sub _RunBlockGamut { +# +# These are all the transformations that form block-level +# tags like paragraphs, headers, and list items. +# + my $text = shift; + + # Do tables first to populate the table id's for cross-refs + # Escape
 so we don't get greedy with tables
+	$text = _DoTables($text);
+	
+	# And now, protect our tables
+	$text = _HashHTMLBlocks($text);
+
+
+	$text = _DoHeaders($text);
+
+	# Do Horizontal Rules:
+	$text =~ s{^[ ]{0,2}([ ]?\*[ ]?){3,}[ \t]*$}{\n tags around block-level tags.
+	$text = _HashHTMLBlocks($text);
+
+	# Escape 
 so we don't get greedy with tables
+#	$text = _DoTables($text);
+	
+	# And now, protect our tables
+#	$text = _HashHTMLBlocks($text);
+
+	$text = _FormParagraphs($text);
+
+	return $text;
+}
+
+
+sub _RunSpanGamut {
+#
+# Run the span-level transformations, i.e. those that occur *within* block-level
+# tags like paragraphs, headers, and list items. Takes the text to transform as its only argument.
+# The order of the calls below is significant (see the per-step comments).
+	my $text = shift;
+
+	$text = _DoCodeSpans($text);
+
+	$text = _EscapeSpecialChars($text);
+
+	# Process anchor and image tags. Images must come first,
+	# because ![foo][f] looks like an anchor.
+	$text = _DoImages($text);
+	$text = _DoAnchors($text);
+
+	# Process WikiWords, but only when wiki links are enabled and not temporarily switched off via $g_temp_no_wikiwords
+	if ($g_use_wiki_links && !$g_temp_no_wikiwords) {
+		$text = _DoWikiLinks($text);
+		
+		# And then reprocess anchors and images
+		$text = _DoImages($text);
+		$text = _DoAnchors($text);
+	}
+	
+
+	# Make links out of bare URLs that are wrapped in angle brackets.
+	# Must come after _DoAnchors(), because you can use < and >
+	# delimiters around the URL of an inline link such as [this](url).
+	$text = _DoAutoLinks($text);
+
+	$text = _EncodeAmpsAndAngles($text);
+
+	$text = _DoItalicsAndBold($text);
+
+	# Do hard breaks (two or more spaces before a newline). NOTE(review): the substitution below is cut off in this copy; its replacement text, the rest of this sub and the opening of the next one (presumably _EscapeSpecialChars, given the token loop that follows) are missing -- restore from upstream before use.
+	$text =~ s/ {2,}\n/  or  tags.
+# 	my $tags_to_skip = qr!<(/?)(?:pre|code|kbd|script|math)[\s>]!;
+
+	foreach my $cur_token (@$tokens) {
+		if ($cur_token->[0] eq "tag") {
+			# Within tags, encode * and _ so they don't conflict
+			# with their use in Markdown for italics and strong.
+			# We're replacing each such character with its
+			# corresponding MD5 checksum value; this is likely
+			# overkill, but it should prevent us from colliding
+			# with the escape values by accident.
+			$cur_token->[1] =~  s! \* !$g_escape_table{'*'}!gx;
+			$cur_token->[1] =~  s! _  !$g_escape_table{'_'}!gx;
+			$text .= $cur_token->[1];
+		} else {
+			my $t = $cur_token->[1];
+			$t = _EncodeBackslashEscapes($t);
+			$text .= $t;
+		}
+	}
+	return $text;
+}
+
+
+sub _DoAnchors {
+#
+# Turn Markdown link shortcuts into XHTML anchor (a) tags. Takes the text as its only argument.
+# NOTE(review): markup was stripped from this copy -- the replacement of the first substitution breaks off at the line starting with $result, and what follows resumes inside the inline-link pattern. Restore from upstream before use.
+	my $text = shift;
+
+	#
+	# First, handle reference-style links: [link text] [id]
+	#
+	$text =~ s{
+		(					# wrap whole match in $1
+		  \[
+		    ($g_nested_brackets)	# link text = $2
+		  \]
+
+		  [ ]?				# one optional space
+		  (?:\n[ ]*)?		# one optional newline followed by spaces
+
+		  \[
+		    (.*?)		# id = $3
+		  \]
+		)
+	}{
+		my $result;
+		my $whole_match = $1;
+		my $link_text   = $2;
+		my $link_id     = lc $3;
+
+		if ($link_id eq "") {
+			$link_id = lc $link_text;	# for shortcut links like [this][].
+		}
+
+		# Allow automatic cross-references to headers: the id is passed through Header2Label and looked up in %g_crossrefs
+		my $label = Header2Label($link_id);
+		if (defined $g_crossrefs{$label}) {
+			my $url = $g_crossrefs{$label};
+			$url =~ s! \* !$g_escape_table{'*'}!gx;		# We've got to encode these to avoid
+			$url =~ s!  _ !$g_escape_table{'_'}!gx;		# conflicting with italics/bold.
+			$result = "?	# href = $3
+		  	[ \t]*
+			(			# $4
+			  (['"])	# quote char = $5
+			  (.*?)		# Title = $6
+			  \5		# matching quote
+			)?			# title is optional
+		  \)
+		)
+	}{
+		my $result;
+		my $whole_match = $1;
+		my $link_text   = $2;
+		my $url	  		= $3;
+		my $title		= $6;
+
+		$url =~ s! \* !$g_escape_table{'*'}!gx;		# We've got to encode these to avoid
+		$url =~ s!  _ !$g_escape_table{'_'}!gx;		# conflicting with italics/bold.
+		$result = " tags.
+# NOTE(review): the start of this sub (its declaration and the first line of this header comment) is missing from this copy; presumably this is _DoImages, which turns image shortcuts into img tags -- confirm against upstream.
+	my $text = shift;
+
+	#
+	# First, handle reference-style labeled images: ![alt text][id]
+	#
+	$text =~ s{
+		(				# wrap whole match in $1
+		  !\[
+		    (.*?)		# alt text = $2
+		  \]
+
+		  [ ]?				# one optional space
+		  (?:\n[ ]*)?		# one optional newline followed by spaces
+
+		  \[
+		    (.*?)		# id = $3
+		  \]
+
+		)
+	}{
+		my $result;
+		my $whole_match = $1;
+		my $alt_text    = $2;
+		my $link_id     = lc $3;
+
+		if ($link_id eq "") {
+			$link_id = lc $alt_text;     # for shortcut links like ![this][].
+		}
+# NOTE(review): as written, the substitution below replaces a double quote with itself; presumably an HTML entity was decoded when this copy was made -- confirm.
+		$alt_text =~ s/"/"/g;
+		if (defined $g_urls{$link_id}) {
+			my $url = $g_urls{$link_id};
+			$url =~ s! \* !$g_escape_table{'*'}!gx;		# We've got to encode these to avoid
+			$url =~ s!  _ !$g_escape_table{'_'}!gx;		# conflicting with italics/bold.
+			# Register the alt text as a cross-reference label; fall back to the alt text as title when the id has none
+			my $label = Header2Label($alt_text);
+			$g_crossrefs{$label} = "#$label";
+			if (! defined $g_titles{$link_id}) {
+				$g_titles{$link_id} = $alt_text;
+			}
+			
+			$result = "\"$alt_text\"";?	# src url = $3
+		  	[ \t]*
+			(			# $4
+			  (['"])	# quote char = $5
+			  (.*?)		# title = $6
+			  \5		# matching quote
+			  [ \t]*
+			)?			# title is optional
+		  \)
+		)
+	}{
+		my $result;
+		my $whole_match = $1;
+		my $alt_text    = $2;
+		my $url	  		= $3;
+		my $title		= '';
+		if (defined($6)) {
+			$title		= $6;
+		}
+
+		$alt_text =~ s/"/"/g;
+		$title    =~ s/"/"/g;
+		$url =~ s! \* !$g_escape_table{'*'}!gx;		# We've got to encode these to avoid
+		$url =~ s!  _ !$g_escape_table{'_'}!gx;		# conflicting with italics/bold.
+
+		my $label = Header2Label($alt_text);
+		$g_crossrefs{$label} = "#$label";
+#		$g_titles{$label} = $alt_text;			# I think this line should not be here
+			
+		$result = "\"$alt_text\"";"  .  _RunSpanGamut($1)  .  "\n\n";
+	}egmx;
+
+	$text =~ s{ ^(.+)[ \t]*\n-+[ \t]*\n+ }{
+		$label = Header2Label($1);
+		$header = _RunSpanGamut($1);
+		
+		$g_crossrefs{$label} = "#$label";
+		$g_titles{$label} = $header;
+		
+		"

" . _RunSpanGamut($1) . "

\n\n"; + }egmx; + + + # atx-style headers: + # # Header 1 + # ## Header 2 + # ## Header 2 with closing hashes ## + # ... + # ###### Header 6 + # + $text =~ s{ + ^(\#{1,6}) # $1 = string of #'s + [ \t]* + (.+?) # $2 = Header text + [ \t]* + \#* # optional closing #'s (not counted) + \n+ + }{ + my $h_level = length($1); + $label = Header2Label($2); + $header = _RunSpanGamut($2); + + $g_crossrefs{$label} = "#$label"; + $g_titles{$label} = $header; + "" . $header . "\n\n"; + }egmx; + + # Can now process Wiki Links again + $g_temp_no_wikiwords = 0; + + return $text; +} + + +sub _DoLists { +# +# Form HTML ordered (numbered) and unordered (bulleted) lists. +# + my $text = shift; + my $less_than_tab = $g_tab_width - 1; + + # Re-usable patterns to match list item bullets and number markers: + my $marker_ul = qr/[*+-]/; + my $marker_ol = qr/\d+[.]/; + my $marker_any = qr/(?:$marker_ul|$marker_ol)/; + + # Re-usable pattern to match any entirel ul or ol list: + my $whole_list = qr{ + ( # $1 = whole list + ( # $2 + [ ]{0,$less_than_tab} + (${marker_any}) # $3 = first list item marker + [ \t]+ + ) + (?s:.+?) + ( # $4 + \z + | + \n{2,} + (?=\S) + (?! # Negative lookahead for another list item marker + [ \t]* + ${marker_any}[ \t]+ + ) + ) + ) + }mx; + + # We use a different prefix before nested lists than top-level lists. + # See extended comment in _ProcessListItems(). + # + # Note: There's a bit of duplication here. My original implementation + # created a scalar regex pattern as the conditional result of the test on + # $g_list_level, and then only ran the $text =~ s{...}{...}egmx + # substitution once, using the scalar as the pattern. This worked, + # everywhere except when running under MT on my hosting account at Pair + # Networks. There, this caused all rebuilds to be killed by the reaper (or + # perhaps they crashed, but that seems incredibly unlikely given that the + # same script on the same server ran fine *except* under MT. 
I've spent + # more time trying to figure out why this is happening than I'd like to + # admit. My only guess, backed up by the fact that this workaround works, + # is that Perl optimizes the substition when it can figure out that the + # pattern will never change, and when this optimization isn't on, we run + # afoul of the reaper. Thus, the slightly redundant code to that uses two + # static s/// patterns rather than one conditional pattern. + + if ($g_list_level) { + $text =~ s{ + ^ + $whole_list + }{ + my $list = $1; + my $list_type = ($3 =~ m/$marker_ul/) ? "ul" : "ol"; + # Turn double returns into triple returns, so that we can make a + # paragraph for the last item in a list, if necessary: + $list =~ s/\n{2,}/\n\n\n/g; + my $result = _ProcessListItems($list, $marker_any); + $result = "<$list_type>\n" . $result . "\n"; + $result; + }egmx; + } + else { + $text =~ s{ + (?:(?<=\n\n)|\A\n?) + $whole_list + }{ + my $list = $1; + my $list_type = ($3 =~ m/$marker_ul/) ? "ul" : "ol"; + # Turn double returns into triple returns, so that we can make a + # paragraph for the last item in a list, if necessary: + $list =~ s/\n{2,}/\n\n\n/g; + my $result = _ProcessListItems($list, $marker_any); + $result = "<$list_type>\n" . $result . "\n"; + $result; + }egmx; + } + + + return $text; +} + + +sub _ProcessListItems { +# +# Process the contents of a single ordered or unordered list, splitting it +# into individual list items. +# + + my $list_str = shift; + my $marker_any = shift; + + + # The $g_list_level global keeps track of when we're inside a list. + # Each time we enter a list, we increment it; when we leave a list, + # we decrement. If it's zero, we're not in a list anymore. + # + # We do this because when we're not inside a list, we want to treat + # something like this: + # + # I recommend upgrading to version + # 8. Oops, now this line is treated + # as a sub-list. 
+ # + # As a single paragraph, despite the fact that the second line starts + # with a digit-period-space sequence. + # + # Whereas when we're inside a list (or sub-list), that line will be + # treated as the start of a sub-list. What a kludge, huh? This is + # an aspect of Markdown's syntax that's hard to parse perfectly + # without resorting to mind-reading. Perhaps the solution is to + # change the syntax rules such that sub-lists must start with a + # starting cardinal number; e.g. "1." or "a.". + + $g_list_level++; + + # trim trailing blank lines: + $list_str =~ s/\n{2,}\z/\n/; + + + $list_str =~ s{ + (\n)? # leading line = $1 + (^[ \t]*) # leading whitespace = $2 + ($marker_any) [ \t]+ # list marker = $3 + ((?s:.+?) # list item text = $4 + (\n{1,2})) + (?= \n* (\z | \2 ($marker_any) [ \t]+)) + }{ + my $item = $4; + my $leading_line = $1; + my $leading_space = $2; + + if ($leading_line or ($item =~ m/\n{2,}/)) { + $item = _RunBlockGamut(_Outdent($item)); + } + else { + # Recursion for sub-lists: + $item = _DoLists(_Outdent($item)); + chomp $item; + $item = _RunSpanGamut($item); + } + + "
  • " . $item . "
  • \n"; + }egmx; + + $g_list_level--; + return $list_str; +} + + + +sub _DoCodeBlocks { +# +# Process Markdown `
    ` blocks.
    +#	
    +
    +	my $text = shift;
    +
    +	$text =~ s{
    +			(?:\n\n|\A)
    +			(	            # $1 = the code block -- one or more lines, starting with a space/tab
    +			  (?:
    +			    (?:[ ]{$g_tab_width} | \t)  # Lines must start with a tab or a tab-width of spaces
    +			    .*\n+
    +			  )+
    +			)
    +			((?=^[ ]{0,$g_tab_width}\S)|\Z)	# Lookahead for non-space at line-start, or end of doc
    +		}{
    +			my $codeblock = $1;
    +			my $result; # return value
    +
    +			$codeblock = _EncodeCode(_Outdent($codeblock));
    +			$codeblock = _Detab($codeblock);
    +			$codeblock =~ s/\A\n+//; # trim leading newlines
    +			$codeblock =~ s/\s+\z//; # trim trailing whitespace
    +
    +			$result = "\n\n
    " . $codeblock . "\n
    \n\n"; + + $result; + }egmx; + + return $text; +} + + +sub _DoCodeSpans { +# +# * Backtick quotes are used for spans. +# +# * You can use multiple backticks as the delimiters if you want to +# include literal backticks in the code span. So, this input: +# +# Just type ``foo `bar` baz`` at the prompt. +# +# Will translate to: +# +#

    Just type foo `bar` baz at the prompt.

    +# +# There's no arbitrary limit to the number of backticks you +# can use as delimters. If you need three consecutive backticks +# in your code, use four for delimiters, etc. +# +# * You can use spaces to get literal backticks at the edges: +# +# ... type `` `bar` `` ... +# +# Turns to: +# +# ... type `bar` ... +# + + my $text = shift; + + $text =~ s@ + (`+) # $1 = Opening run of ` + (.+?) # $2 = The code block + (?$c
    "; + @egsx; + + return $text; +} + + +sub _EncodeCode { +# +# Encode/escape certain characters inside Markdown code runs. +# The point is that in code, these characters are literals, +# and lose their special Markdown meanings. +# + local $_ = shift; + + # Protect Wiki Links in Code Blocks + if ($g_use_wiki_links) { + my $WikiWord = '[A-Z]+[a-z\x80-\xff]+[A-Z][A-Za-z\x80-\xff]*'; + s/($WikiWord)/\\$1/gx; + } + + # Encode all ampersands; HTML entities are not + # entities within a Markdown code span. + s/&/&/g; + + # Encode $'s, but only if we're running under Blosxom. + # (Blosxom interpolates Perl variables in article bodies.) + { + no warnings 'once'; + if (defined($blosxom::version)) { + s/\$/$/g; + } + } + + + # Do the angle bracket song and dance: + s! < !<!gx; + s! > !>!gx; + + # Now, escape characters that are magic in Markdown: + s! \* !$g_escape_table{'*'}!gx; + s! _ !$g_escape_table{'_'}!gx; + s! { !$g_escape_table{'{'}!gx; + s! } !$g_escape_table{'}'}!gx; + s! \[ !$g_escape_table{'['}!gx; + s! \] !$g_escape_table{']'}!gx; + s! \\ !$g_escape_table{'\\'}!gx; + + return $_; +} + + +sub _DoItalicsAndBold { + my $text = shift; + + # Handle at beginning of lines: + $text =~ s{ ^(\*\*|__) (?=\S) (.+?[*_]*) (?<=\S) \1 } + {$2}gsx; + + $text =~ s{ ^(\*|_) (?=\S) (.+?) (?<=\S) \1 } + {$2}gsx; + + # must go first: + $text =~ s{ (?<=\W) (\*\*|__) (?=\S) (.+?[*_]*) (?<=\S) \1 } + {$2}gsx; + + $text =~ s{ (?<=\W) (\*|_) (?=\S) (.+?) (?<=\S) \1 } + {$2}gsx; + + # And now, a second pass to catch nested strong and emphasis special cases + $text =~ s{ (?<=\W) (\*\*|__) (?=\S) (.+?[*_]*) (?<=\S) \1 } + {$2}gsx; + + $text =~ s{ (?<=\W) (\*|_) (?=\S) (.+?) (?<=\S) \1 } + {$2}gsx; + + return $text; +} + + +sub _DoBlockQuotes { + my $text = shift; + + $text =~ s{ + ( # Wrap whole match in $1 + ( + ^[ \t]*>[ \t]? 
# '>' at the start of a line + .+\n # rest of the first line + (.+\n)* # subsequent consecutive lines + \n* # blanks + )+ + ) + }{ + my $bq = $1; + $bq =~ s/^[ \t]*>[ \t]?//gm; # trim one level of quoting + $bq =~ s/^[ \t]+$//mg; # trim whitespace-only lines + $bq = _RunBlockGamut($bq); # recurse + + $bq =~ s/^/ /g; + # These leading spaces screw with
     content, so we need to fix that:
    +			$bq =~ s{
    +					(\s*
    .+?
    ) + }{ + my $pre = $1; + $pre =~ s/^ //mg; + $pre; + }egsx; + + "
    \n$bq\n
    \n\n"; + }egmx; + + + return $text; +} + + +sub _FormParagraphs { +# +# Params: +# $text - string to process with html

    tags +# + my $text = shift; + + # Strip leading and trailing lines: + $text =~ s/\A\n+//; + $text =~ s/\n+\z//; + + my @grafs = split(/\n{2,}/, $text); + + # + # Wrap

    tags. + # + foreach (@grafs) { + unless (defined( $g_html_blocks{$_} )) { + $_ = _RunSpanGamut($_); + s/^([ \t]*)/

    /; + $_ .= "

    "; + } + } + + # + # Unhashify HTML blocks + # + foreach (@grafs) { + if (defined( $g_html_blocks{$_} )) { + $_ = $g_html_blocks{$_}; + } + } + + return join "\n\n", @grafs; +} + + +sub _EncodeAmpsAndAngles { +# Smart processing for ampersands and angle brackets that need to be encoded. + + my $text = shift; + + # Ampersand-encoding based entirely on Nat Irons's Amputator MT plugin: + # http://bumppo.net/projects/amputator/ + $text =~ s/&(?!#?[xX]?(?:[0-9a-fA-F]+|\w+);)/&/g; + + # Encode naked <'s + $text =~ s{<(?![a-z/?\$!])}{<}gi; + + # And >'s - added by Fletcher Penney +# $text =~ s{>(?![a-z/?\$!])}{>}gi; +# Causes problems... + + return $text; +} + + +sub _EncodeBackslashEscapes { +# +# Parameter: String. +# Returns: The string, with after processing the following backslash +# escape sequences. +# + local $_ = shift; + + s! \\\\ !$g_escape_table{'\\'}!gx; # Must process escaped backslashes first. + s! \\` !$g_escape_table{'`'}!gx; + s! \\\* !$g_escape_table{'*'}!gx; + s! \\_ !$g_escape_table{'_'}!gx; + s! \\\{ !$g_escape_table{'{'}!gx; + s! \\\} !$g_escape_table{'}'}!gx; + s! \\\[ !$g_escape_table{'['}!gx; + s! \\\] !$g_escape_table{']'}!gx; + s! \\\( !$g_escape_table{'('}!gx; + s! \\\) !$g_escape_table{')'}!gx; + s! \\> !$g_escape_table{'>'}!gx; + s! \\\# !$g_escape_table{'#'}!gx; + s! \\\+ !$g_escape_table{'+'}!gx; + s! \\\- !$g_escape_table{'-'}!gx; + s! \\\. !$g_escape_table{'.'}!gx; + s{ \\! }{$g_escape_table{'!'}}gx; + + return $_; +} + + +sub _DoAutoLinks { + my $text = shift; + + $text =~ s{<((https?|ftp):[^'">\s]+)>}{
    $1}gi; + + # Email addresses: + $text =~ s{ + < + (?:mailto:)? + ( + [-.\w]+ + \@ + [-a-z0-9]+(\.[-a-z0-9]+)*\.[a-z]+ + ) + > + }{ + _EncodeEmailAddress( _UnescapeSpecialChars($1) ); + }egix; + + return $text; +} + + +sub _EncodeEmailAddress { +# +# Input: an email address, e.g. "foo@example.com" +# +# Output: the email address as a mailto link, with each character +# of the address encoded as either a decimal or hex entity, in +# the hopes of foiling most address harvesting spam bots. E.g.: +# +# foo +# @example.com +# +# Based on a filter by Matthew Wickline, posted to the BBEdit-Talk +# mailing list: +# + + my $addr = shift; + + srand; + my @encode = ( + sub { '&#' . ord(shift) . ';' }, + sub { '&#x' . sprintf( "%X", ord(shift) ) . ';' }, + sub { shift }, + ); + + $addr = "mailto:" . $addr; + + $addr =~ s{(.)}{ + my $char = $1; + if ( $char eq '@' ) { + # this *must* be encoded. I insist. + $char = $encode[int rand 1]->($char); + } elsif ( $char ne ':' ) { + # leave ':' alone (to spot mailto: later) + my $r = rand; + # roughly 10% raw, 45% hex, 45% dec + $char = ( + $r > .9 ? $encode[2]->($char) : + $r < .45 ? $encode[1]->($char) : + $encode[0]->($char) + ); + } + $char; + }gex; + + $addr = qq{$addr}; + $addr =~ s{">.+?:}{">}; # strip the mailto: from the visible part + + return $addr; +} + + +sub _UnescapeSpecialChars { +# +# Swap back in all the special characters we've hidden. +# + my $text = shift; + + while( my($char, $hash) = each(%g_escape_table) ) { + $text =~ s/$hash/$char/g; + } + return $text; +} + + +sub _TokenizeHTML { +# +# Parameter: String containing HTML markup. +# Returns: Reference to an array of the tokens comprising the input +# string. Each token is either a tag (possibly with nested, +# tags contained therein, such as , or a +# run of text between tags. Each element of the array is a +# two-element array; the first is either 'tag' or 'text'; +# the second is the actual value. 
+# +# +# Derived from the _tokenize() subroutine from Brad Choate's MTRegex plugin. +# +# + + my $str = shift; + my $pos = 0; + my $len = length $str; + my @tokens; + + my $depth = 6; + my $nested_tags = join('|', ('(?:<[a-z/!$](?:[^<>]') x $depth) . (')*>)' x $depth); + my $match = qr/(?s: ) | # comment + (?s: <\? .*? \?> ) | # processing instruction + $nested_tags/ix; # nested tags + + while ($str =~ m/($match)/g) { + my $whole_tag = $1; + my $sec_start = pos $str; + my $tag_start = $sec_start - length $whole_tag; + if ($pos < $tag_start) { + push @tokens, ['text', substr($str, $pos, $tag_start - $pos)]; + } + push @tokens, ['tag', $whole_tag]; + $pos = pos $str; + } + push @tokens, ['text', substr($str, $pos, $len - $pos)] if $pos < $len; + \@tokens; +} + + +sub _Outdent { +# +# Remove one level of line-leading tabs or spaces +# + my $text = shift; + + $text =~ s/^(\t|[ ]{1,$g_tab_width})//gm; + return $text; +} + + +sub _Detab { +# +# Cribbed from a post by Bart Lateur: +# +# + my $text = shift; + + $text =~ s{(.*?)\t}{$1.(' ' x ($g_tab_width - length($1) % $g_tab_width))}ge; + return $text; +} + +# +# MultiMarkdown Routines +# + +sub _ParseMetaData { + my $text = shift; + my $clean_text = ""; + + my ($inMetaData, $currentKey) = (1,''); + + foreach my $line ( split /\n/, $text ) { + $line =~ /^$/ and $inMetaData = 0 and $clean_text .= $line and next; + if ($inMetaData) { + if ($line =~ /^([a-zA-Z0-9][0-9a-zA-Z ]+?):\s*(.*)$/ ) { + $currentKey = $1; + $currentKey =~ s/ / /g; + $g_metadata{$currentKey} = $2; + if (lc($currentKey) eq "format") { + $g_document_format = lc($g_metadata{$currentKey}); + } + if (lc($currentKey) eq "base url") { + $g_base_url = $g_metadata{$currentKey}; + } + if (lc($currentKey) eq "use wikilinks") { + if (lc($g_metadata{$currentKey}) eq "true" || + $g_metadata{$currentKey} eq "1") { + $g_use_wiki_links = 1; + } + } + if (!$g_metadata_newline{$currentKey}) { + $g_metadata_newline{$currentKey} = $g_metadata_newline{default}; + } + } else 
{ + if ($currentKey eq "") { + # No metadata present + $clean_text .= "$line\n"; + $inMetaData = 0; + next; + } + if ($line =~ /^\s*(.+)$/ ) { + $g_metadata{$currentKey} .= "$g_metadata_newline{$currentKey}$1"; + } + } + } else { + $clean_text .= "$line\n"; + } + } + + return $clean_text; +} + +sub _StripFootnoteDefinitions { + my $text = shift; + my $less_than_tab = $g_tab_width - 1; + + while ($text =~ s{ + \n\[\^(.+?)\]:[ \t]*# id = $1 + \n? + (.*?)\n{1,2} # end at new paragraph + ((?=\n[ ]{0,$less_than_tab}\S)|\Z) # Lookahead for non-space at line-start, or end of doc + } + {\n}sx) + { + my $id = $1; + my $footnote = "$2\n"; + $footnote =~ s/^[ ]{0,$g_tab_width}//gm; + + $footnote = _RunBlockGamut($footnote); + + # strip leading

    tag (it will be added later) + $footnote =~ s/^\//s; + + $g_footnotes{Header2Label($id)} = $footnote; + } + + return $text; +} + +sub _DoFootnotes { + my $text = shift; + + $text =~ s{ + \[\^(.*?)\] # id = $1 + }{ + my $result; + my $id = Header2Label($1); + + if (defined $g_footnotes{$id} ) { +# $result = "$g_footnotes{Header2Label($id)}" + $g_footnote_counter++; + $result = "$g_footnote_counter"; + push (@g_used_footnotes,$id); + } + $result; + }xsge; + + return $text; +} + +sub _FixFootnoteParagraphs { + my $text = shift; + + $text =~ s/^\\<\/footnote\>/<\/footnote>/gm; + + return $text; +} + +sub _PrintFootnotes{ + my $footnote_counter = 0; + my $result; + + foreach my $id (@g_used_footnotes) { + $footnote_counter++; + $result.="

    $footnote_counter. $g_footnotes{$id}

    \n\n"; + } + $result .= ""; + + if ($footnote_counter > 0) { + $result = "\n\n
    \nFootnotes:

    \n\n".$result; + } else { + $result = ""; + } + + return $result; +} + +sub Header2Label { + my $header = shift; + my $label = lc $header; + $label =~ s/[^A-Za-z0-9:_.-]//g; # Strip illegal characters + $label =~ s/^[^A-Za-z]//g; # Strip illegal leading characters + return $label; +} + +sub xhtmlMetaData { + my $result = qq{\n}; + + # This screws up xsltproc - make sure to use `-nonet -novalid` if you + # have difficulty + $result .= qq{\n}; + + $result.= "\n\t\n"; + + foreach my $key (sort keys %g_metadata ) { + if (lc($key) eq "title") { + $result.= "\t\t$g_metadata{$key}\n"; + } elsif (lc($key) eq "css") { + $result.= "\t\t\n/g; + + if ($result ne "") { + $result.= "\n"; + } + + return $result; +} + +sub _ConvertCopyright{ + my $text = shift; + # Convert to an XML compatible form of copyright symbol + + $text =~ s/©/©/gi; + + return $text; +} + +sub _CreateWikiLink { + my $title = shift; + + my $id = $title; + $id =~ s/ /_/g; + $id =~ s/__+/_/g; + $id =~ s/^_//g; + $id =~ s/_$//; + + $title =~ s/_/ /g; + + return "[$title]($g_base_url$id)"; +} + +sub _DoWikiLinks { + + my $text = shift; + my $WikiWord = '[A-Z]+[a-z\x80-\xff]+[A-Z][A-Za-z\x80-\xff]*'; + my $FreeLinkPattern = "([-,.()' _0-9A-Za-z\x80-\xff]+)"; + + if ($g_use_wiki_links) { + # FreeLinks + $text =~ s{ + \[\[($FreeLinkPattern)\]\] + }{ + my $label = $1; + $label =~ s{ + ([\s\>])($WikiWord) + }{ + $1 ."\\" . $2 + }xsge; + + _CreateWikiLink($label) + }xsge; + } + + # WikiWords + if ($g_use_wiki_links) { + $text =~ s{ + ([\s])($WikiWord) + }{ + $1 . 
_CreateWikiLink($2) + }xsge; + + # Catch WikiWords at beginning of text + $text =~ s{^($WikiWord) + }{ + _CreateWikiLink($1) + }xse; + } + + + return $text; +} + +sub _UnescapeWikiWords { + my $text = shift; + my $WikiWord = '[A-Z]+[a-z\x80-\xff]+[A-Z][A-Za-z\x80-\xff]*'; + + # Unescape escaped WikiWords + $text =~ s/\\($WikiWord)/$1/g; + + return $text; +} + + +sub _DoTables { + my $text = shift; + my $less_than_tab = $g_tab_width - 1; + + # Algorithm inspired by PHP Markdown Extra's + # + + # Reusable regexp's to match table + + my $line_start = qr{ + [ ]{0,$less_than_tab} + }mx; + + my $table_row = qr{ + [^\n]*?\|[^\n]*?\n + }mx; + + my $first_row = qr{ + $line_start + \S+.*?\|.*?\n + }mx; + + my $table_rows = qr{ + (\n?$table_row) + }mx; + + my $table_caption = qr{ + $line_start + \[.*?\][ \t]*\n + }mx; + + my $table_divider = qr{ + $line_start + [\|\-\:\.][ \-\|\:\.]* \| [ \-\|\:\.]* + }mx; + + my $whole_table = qr{ + ($table_caption)? # Optional caption + ($first_row # First line must start at beginning + ($table_row)*?)? # Header Rows + $table_divider # Divider/Alignment definitions + $table_rows+ # Body Rows + ($table_caption)? # Optional caption + }mx; + + + # Find whole tables, then break them up and process them + + $text =~ s{ + ^($whole_table) # Whole table in $1 + (\n|\Z) # End of file or 2 blank lines + }{ + my $table = $1; + my $result = "\n"; + my @alignments; + my $use_row_header = 0; + + # Add Caption, if present + + if ($table =~ s/^$line_start\[\s*(.*?)\s*\](\[\s*(.*?)\s*\])?[ \t]*$//m) { + if (defined $3) { + $result .= "\n"; + + # add caption id to cross-ref list + $g_crossrefs{$3} = "#$3"; + $g_titles{$3} = "$1"; + } else { + $result .= "\n"; + } + } + + # If a second "caption" is present, treat it as a summary + # However, this is not valid in XHTML 1.0 Stric + # But maybe in future + + # A summary might be longer than one line + if ($table =~ s/\n$line_start\[\s*(.*?)\s*\][ \t]*\n/\n/s) { + # $result .= "" . _RunSpanGamut($1) . 
"\n"; + } + + # Now, divide table into header, alignment, and body + + # First, add leading \n in case there is no header + + $table = "\n" . $table; + + # Need to be greedy + + $table =~ s/\n($table_divider)\n(($table_rows)+)//s; + + my $alignment_string = $1; + my $body = $2; + + # Process column alignment + while ($alignment_string =~ /\|?\s*(.+?)\s*(\||\Z)/gs) { + my $cell = _RunSpanGamut($1); + if ($cell =~ /\:$/) { + if ($cell =~ /^\:/) { + $result .= "$cell\n"; + } else { + $result .= "\t<$cell_type$colspan>$cell\n"; + } + $count++; + } + $result .= "\n"; + } + + $result .= "\n
    " . _RunSpanGamut($1). "" . _RunSpanGamut($1). "
    \n"; + $result + }egmx; + + my $table_body = qr{ + ( # wrap whole match in $2 + + (.*?\|.*?)\n # wrap headers in $3 + + [ ]{0,$less_than_tab} + ($table_divider) # alignment in $4 + + ( # wrap cells in $5 + $table_rows + ) + ) + }mx; + + return $text; +} + + +sub _DoAttributes{ + my $id = shift; + my $result = ""; + + if (defined $g_attributes{$id}) { + while ($g_attributes{$id} =~ s/(\S+)="(.*?)"//g) { + $result .= " $1=\"$2\""; + } + while ($g_attributes{$id} =~ /(\S+)=(\S+)/g) { + $result .= " $1=\"$2\""; + } + } + + return $result; +} + + +sub _StripMarkdownReferences { + my $text = shift; + my $less_than_tab = $g_tab_width - 1; + + while ($text =~ s{ + \n\[\#(.+?)\]:[ \t]* # id = $1 + \n? + (.*?)\n{1,2} # end at new paragraph + ((?=\n[ ]{0,$less_than_tab}\S)|\Z) # Lookahead for non-space at line-start, or end of doc + } + {\n}sx) + { + my $id = $1; + my $reference = "$2\n"; + + $reference =~ s/^[ ]{0,$g_tab_width}//gm; + + $reference = _RunBlockGamut($reference); + + # strip leading and trailing

    tags (they will be added later) + $reference =~ s/^\//s; + $reference =~ s/\<\/p\>\s*$//s; + + $g_references{$id} = $reference; + } + + return $text; +} + +sub _DoMarkdownCitations { + my $text = shift; + + $text =~ s{ + \[([^\[]*?)\] # citation text = $1 + [ ]? # one optional space + (?:\n[ ]*)? # one optional newline followed by spaces + \[\#(.*?)\] # id = $2 + }{ + my $result; + my $anchor_text = $1; + my $id = $2; + my $count; + + if (defined $g_references{$id} ) { + my $citation_counter=0; + + # See if citation has been used before + foreach my $old_id (@g_used_references) { + $citation_counter++; + $count = $citation_counter if ($old_id eq $id); + } + + if (! defined $count) { + $g_citation_counter++; + $count = $g_citation_counter; + push (@g_used_references,$id); + } + + $result = " ($count"; + + if ($anchor_text ne "") { + $result .=", $anchor_text"; + } + + $result .= ")"; + } else { + # No reference exists + $result = " ($id"; + + if ($anchor_text ne "") { + $result .=", $anchor_text"; + } + + $result .= ")"; + } + + if (Header2Label($anchor_text) eq "notcited"){ + $result = ""; + } + $result; + }xsge; + + return $text; + +} + +sub _PrintMarkdownBibliography{ + my $citation_counter = 0; + my $result; + + foreach my $id (@g_used_references) { + $citation_counter++; + $result.="

    [$citation_counter] $g_references{$id}

    \n\n"; + } + $result .= "
    "; + + if ($citation_counter > 0) { + $result = "\n\n
    \nBibliography

    \n\n".$result; + } else { + $result = ""; + } + + return $result; +} + + +1; +__END__ + +=pod + +=head1 NAME + +B + + +=head1 SYNOPSIS + +B [ B<--html4tags> ] [ B<--version> ] [ B<-shortversion> ] + [ I ... ] + + +=head1 DESCRIPTION + +Markdown is a text-to-HTML filter; it translates an easy-to-read / +easy-to-write structured text format into HTML. Markdown's text format +is most similar to that of plain text email, and supports features such +as headers, *emphasis*, code blocks, blockquotes, and links. + +Markdown's syntax is designed not as a generic markup language, but +specifically to serve as a front-end to (X)HTML. You can use span-level +HTML tags anywhere in a Markdown document, and you can use block level +HTML tags (like
    <div> and <table> as well). + +For more information about Markdown's syntax, see: + + http://daringfireball.net/projects/markdown/ + + +=head1 OPTIONS + +Use "--" to end switch parsing. For example, to open a file named "-z", use: + + Markdown.pl -- -z + +=over 4 + + +=item B<--html4tags> + +Use HTML 4 style for empty element tags, e.g.: + +
    <br> + +instead of Markdown's default XHTML style tags, e.g.: + +
    <br /> + + +=item B<-v>, B<--version> + +Display Markdown's version number and copyright information. + + +=item B<-s>, B<--shortversion> + +Display the short-form version number. + +=back + + + +=head1 BUGS + +To file bug reports or feature requests (other than topics listed in the +Caveats section above) please send email to: + + support@daringfireball.net (for Markdown issues) + + fletcher@freeshell.org (for MultiMarkdown issues) + +Please include with your report: (1) the example input; (2) the output +you expected; (3) the output Markdown actually produced. + + +=head1 VERSION HISTORY + +See the readme file for detailed release notes for this version. + +1.0.1 - 14 Dec 2004 + +1.0 - 28 Aug 2004 + + +=head1 AUTHOR + + John Gruber + http://daringfireball.net/ + + PHP port and other contributions by Michel Fortin + http://michelf.com/ + + MultiMarkdown changes by Fletcher Penney + http://fletcher.freeshell.org/ + +=head1 COPYRIGHT AND LICENSE + +Original Code Copyright (c) 2003-2004 John Gruber + +All rights reserved. + +MultiMarkdown changes Copyright (c) 2005-2006 Fletcher T. Penney + +All rights reserved. + +Redistribution and use in source and binary forms, with or without +modification, are permitted provided that the following conditions are +met: + +* Redistributions of source code must retain the above copyright notice, + this list of conditions and the following disclaimer. + +* Redistributions in binary form must reproduce the above copyright + notice, this list of conditions and the following disclaimer in the + documentation and/or other materials provided with the distribution. + +* Neither the name "Markdown" nor the names of its contributors may + be used to endorse or promote products derived from this software + without specific prior written permission. 
+ +This software is provided by the copyright holders and contributors "as +is" and any express or implied warranties, including, but not limited +to, the implied warranties of merchantability and fitness for a +particular purpose are disclaimed. In no event shall the copyright owner +or contributors be liable for any direct, indirect, incidental, special, +exemplary, or consequential damages (including, but not limited to, +procurement of substitute goods or services; loss of use, data, or +profits; or business interruption) however caused and on any theory of +liability, whether in contract, strict liability, or tort (including +negligence or otherwise) arising in any way out of the use of this +software, even if advised of the possibility of such damage. + +=cut diff --git a/Support/help.markdown b/Support/help.markdown new file mode 100644 index 0000000..00042f7 --- /dev/null +++ b/Support/help.markdown @@ -0,0 +1,55 @@ +# Setup + +You will need a TextMate Project (a Scratch Project will do) to make this work. + +## Structure + +The following files & folders are needed: + +* `pages` + + This is where all your markdown files go. You need to make a new file for each chapter. It should have one first level heading which will be used for the name of the chapter (in the Table of Contents, for the Navigational Links & in the HTML title). + The files in the `pages` directory are converted to HTML (using Markdown and SmartyPants) with the _Generate_ Command. They have to be in the right order, so they have to be named beginning with numbers followed by a space or an underscore (as seen in the included example). This prefix will be stripped by the Generate Script. + +* `html` + + The generated files will go here. + + * `index.html`: Table of Contents from which you can navigate to all chapters. + * `all_pages.html`: A single file with all chapters. This is mainly for printing and it uses the `print.css` Stylesheet. + * `*.html`: Every chapter has its own file. 
+ + Also, this folder holds two links to the css and images folders. When "deploying" your compiled book, just replace these with the actual folders. + + +* `templates` + + This folder contains three html templates. Adapt them to your needs. + + * `all.rhtml`: template for the `all_pages.html` file which contains all your chapters. + * `chapter.rhtml`: template for each chapter + * `toc.rhtml`: template for the `index.html` file containing the Table of Contents + +* `css` + + This folder contains the stylesheets (`stylesheet.css` and `print.css`). Adapt those as you like. The default style resembles the [TextMate Manual](http://macromates.com/textmate/manual/). + +* `images` + + This folder should hold all your images. When the book is generated `height` and `width` HTML attributes are added to the images. The source path could be changed, too, to make it absolute. + + + +## References + +You can use reference style links (`[link description][link id]`) in your text. There is a command _Update References_ that will collect them from all `.markdown` files in the `pages` folder and write them to a file `markdown.references` in the project root. It notifies you of missing or duplicate entries via a Tooltip. You can then edit this file and insert the link targets within your text. The _Generate_ Script will add `id` attributes to your headings, so you can reference them directly. It converts some characters (`- \/_`) to underscores and strips non-alphanumeric characters afterwards. + +I wrote a command _Show References_ that brings up a dialog with all the references from the `markdown.references` file and inserts a reference snippet. + +## Generation process + +The _Generate_ Command is a Ruby Script, which does some transformation, constructs the Table of Contents and runs all your Markdown files through [Markdown](http://daringfireball.net/projects/markdown/), [SmartyPants](http://daringfireball.net/projects/smartypants/) (for good Typography) and the Image-Script. + +
    + +> Credits to Allan for writing the initial version of all this. I, Soryu, bundled it up in a TextMate bundle and added/polished some stuff. diff --git a/info.plist b/info.plist new file mode 100644 index 0000000..a340630 --- /dev/null +++ b/info.plist @@ -0,0 +1,18 @@ + + + + + name + Markdown2Book + ordering + + C445442D-06BF-4CEE-A642-6209B84632A6 + 749EA16A-700B-43B3-9457-FA12D8301CAE + 3E0EDBF3-2018-46EA-95EE-C4EB20118789 + B3AF90C8-A1B0-4583-A5E4-74374B68B015 + B9B57AA0-0024-41F6-B6AE-C60FCDC1E8B1 + + uuid + FE3F62A4-6416-478F-957F-F17BECA563F6 + +