` blocks. # global $md_tab_width; $text = preg_replace_callback("{ (?:\\n\\n|\\A) ( # $1 = the code block -- one or more lines, starting with a space/tab (?: (?:[ ]\{$md_tab_width} | \\t) # Lines must start with a tab or a tab-width of spaces .*\\n+ )+ ) ((?=^[ ]{0,$md_tab_width}\\S)|\\Z) # Lookahead for non-space at line-start, or end of doc }xm", '_DoCodeBlocks_callback', $text); return $text; } function _DoCodeBlocks_callback($matches) { $codeblock = $matches[1]; $codeblock = _EncodeCode(_Outdent($codeblock)); $codeblock = _Detab($codeblock); # trim leading newlines and trailing whitespace $codeblock = preg_replace(array('/\A\n+/', '/\s+\z/'), '', $codeblock); $result = "\n\n" . $codeblock . "\n\n\n"; return $result; } function _DoCodeSpans($text) { # # * Backtick quotes are used for spans. # # * You can use multiple backticks as the delimiters if you want to # include literal backticks in the code span. So, this input: # # Just type ``foo `bar` baz`` at the prompt. # # Will translate to: # # Just type foo `bar` baz at the prompt. # # There's no arbitrary limit to the number of backticks you # can use as delimters. If you need three consecutive backticks # in your code, use four for delimiters, etc. # # * You can use spaces to get literal backticks at the edges: # # ... type `` `bar` `` ... # # Turns to: # # ... type `bar` ... # $text = preg_replace_callback("@ (`+) # $1 = Opening run of ` (.+?) # $2 = The code block (?$c"; } function _EncodeCode($_) { # # Encode/escape certain characters inside Markdown code runs. # The point is that in code, these characters are literals, # and lose their special Markdown meanings. # global $md_escape_table; # Encode all ampersands; HTML entities are not # entities within a Markdown code span. 
$_ = str_replace('&', '&', $_); # Do the angle bracket song and dance: $_ = str_replace(array('<', '>'), array('<', '>'), $_); # Now, escape characters that are magic in Markdown: $_ = str_replace(array_keys($md_escape_table), array_values($md_escape_table), $_); return $_; } function _DoItalicsAndBold($text) { # must go first: $text = preg_replace('{ (\*\*|__) (?=\S) (.+?) (?<=\S) \1 }sx', '\2', $text); # Then : $text = preg_replace('{ (\*|_) (?=\S) (.+?) (?<=\S) \1 }sx', '\2', $text); return $text; } function _DoBlockQuotes($text) { $text = preg_replace_callback('/ ( # Wrap whole match in $1 ( ^[ \t]*>[ \t]? # ">" at the start of a line .+\n # rest of the first line (.+\n)* # subsequent consecutive lines \n* # blanks )+ ) /xm', '_DoBlockQuotes_callback', $text); return $text; } function _DoBlockQuotes_callback($matches) { $bq = $matches[1]; # trim one level of quoting - trim whitespace-only lines $bq = preg_replace(array('/^[ \t]*>[ \t]?/m', '/^[ \t]+$/m'), '', $bq); $bq = _RunBlockGamut($bq); # recurse $bq = preg_replace('/^/m', " ", $bq); # These leading spaces screw with content, so we need to fix that: $bq = preg_replace_callback('{(\s*
.+?
)}sx', '_DoBlockQuotes_callback2', $bq); return "
\n$bq\n
\n\n"; } function _DoBlockQuotes_callback2($matches) { $pre = $matches[1]; $pre = preg_replace('/^ /m', '', $pre); return $pre; } function _FormParagraphs($text) { # # Params: # $text - string to process with html
tags # global $md_html_blocks; # Strip leading and trailing lines: $text = preg_replace(array('/\A\n+/', '/\n+\z/'), '', $text); $grafs = preg_split('/\n{2,}/', $text, -1, PREG_SPLIT_NO_EMPTY); $count = count($grafs); # # Wrap
tags. # foreach ($grafs as $key => $value) { if (!isset( $md_html_blocks[$value] )) { $value = _RunSpanGamut($value); $value = preg_replace('/^([ \t]*)/', '
', $value); $value .= "
"; $grafs[$key] = $value; } } # # Unhashify HTML blocks # foreach ($grafs as $key => $value) { if (isset( $md_html_blocks[$value] )) { $grafs[$key] = $md_html_blocks[$value]; } } return implode("\n\n", $grafs); } function _EncodeAmpsAndAngles($text) { # Smart processing for ampersands and angle brackets that need to be encoded. # Ampersand-encoding based entirely on Nat Irons's Amputator MT plugin: # http://bumppo.net/projects/amputator/ $text = preg_replace('/&(?!#?[xX]?(?:[0-9a-fA-F]+|\w+);)/', '&', $text);; # Encode naked <'s $text = preg_replace('{<(?![a-z/?\$!])}i', '<', $text); return $text; } function _EncodeBackslashEscapes($text) { # # Parameter: String. # Returns: The string, with after processing the following backslash # escape sequences. # global $md_escape_table, $md_backslash_escape_table; # Must process escaped backslashes first. return str_replace(array_keys($md_backslash_escape_table), array_values($md_backslash_escape_table), $text); } function _DoAutoLinks($text) { $text = preg_replace("!<((https?|ftp):[^'\">\\s]+)>!", '\1', $text); # Email addresses: $text = preg_replace('{ < ( [-.\w]+ \@ [-a-z0-9]+(\.[-a-z0-9]+)*\.[a-z]+ ) > }exi', "_EncodeEmailAddress(_UnescapeSpecialChars(_UnslashQuotes('\\1')))", $text); return $text; } function _EncodeEmailAddress($addr) { # # Input: an email address, e.g. "foo@example.com" # # Output: the email address as a mailto link, with each character # of the address encoded as either a decimal or hex entity, in # the hopes of foiling most address harvesting spam bots. E.g.: # # foo # @example.com # # Based by a filter by Matthew Wickline, posted to the BBEdit-Talk # mailing list: # $addr = "mailto:" . 
$addr; $length = strlen($addr); # leave ':' alone (to spot mailto: later) $addr = preg_replace_callback('/([^\:])/', '_EncodeEmailAddress_callback', $addr); $addr = "$addr"; # strip the mailto: from the visible part $addr = preg_replace('/">.+?:/', '">', $addr); return $addr; } function _EncodeEmailAddress_callback($matches) { $char = $matches[1]; $r = rand(0, 100); # roughly 10% raw, 45% hex, 45% dec # '@' *must* be encoded. I insist. if ($r > 90 && $char != '@') return $char; if ($r < 45) return '&#x'.dechex(ord($char)).';'; return '&#'.ord($char).';'; } function _UnescapeSpecialChars($text) { # # Swap back in all the special characters we've hidden. # global $md_escape_table; return str_replace(array_values($md_escape_table), array_keys($md_escape_table), $text); } # Tokenize_HTML is shared between PHP Markdown and PHP SmartyPants. # We only define it if it is not already defined. if (!function_exists('_TokenizeHTML')) { function _TokenizeHTML($str) { # # Parameter: String containing HTML markup. # Returns: An array of the tokens comprising the input # string. Each token is either a tag (possibly with nested, # tags contained therein, such as , or a # run of text between tags. Each element of the array is a # two-element array; the first is either 'tag' or 'text'; # the second is the actual value. # # # Regular expression derived from the _tokenize() subroutine in # Brad Choate's MTRegex plugin. # # $index = 0; $tokens = array(); $depth = 6; $nested_tags = str_repeat('(?:<[a-z\/!$](?:[^<>]|',$depth) .str_repeat(')*>)', $depth); $match = "(?s:)|". # comment "(?s:<\?.*?\?>)|". 
# processing instruction "$nested_tags"; # nested tags $parts = preg_split("/($match)/", $str, -1, PREG_SPLIT_DELIM_CAPTURE); foreach ($parts as $part) { if (++$index % 2 && $part != '') array_push($tokens, array('text', $part)); else array_push($tokens, array('tag', $part)); } return $tokens; } } function _Outdent($text) { # # Remove one level of line-leading tabs or spaces # global $md_tab_width; return preg_replace("/^(\\t|[ ]{1,$md_tab_width})/m", "", $text); } function _Detab($text) { # # Inspired from a post by Bart Lateur: # # global $md_tab_width; $text = preg_replace( "/(.*?)\t/e", "'\\1'.str_repeat(' ', $md_tab_width - strlen('\\1') % $md_tab_width)", $text); return $text; } function _UnslashQuotes($text) { # # This function is useful to remove automaticaly slashed double quotes # when using preg_replace and evaluating an expression. # Parameter: String. # Returns: The string with any slash-double-quote (\") sequence replaced # by a single double quote. # return str_replace('\"', '"', $text); } /* PHP Markdown ============ Description ----------- This is a PHP translation of the original Markdown formatter written in Perl by John Gruber. Markdown is a text-to-HTML filter; it translates an easy-to-read / easy-to-write structured text format into HTML. Markdown's text format is most similar to that of plain text email, and supports features such as headers, *emphasis*, code blocks, blockquotes, and links. Markdown's syntax is designed not as a generic markup language, but specifically to serve as a front-end to (X)HTML. You can use span-level HTML tags anywhere in a Markdown document, and you can use block level HTML tags (like
<div> and <table> as well). For more information about Markdown's syntax, see: <http://daringfireball.net/projects/markdown/> Bugs ---- To file bug reports please send email to: Please include with your report: (1) the example input; (2) the output you expected; (3) the output Markdown actually produced. Version History --------------- 1.0: Sat 21 Aug 2004 * Fixed a couple of bugs in _DoLists() and _ProcessListItems() that caused unordered lists starting with `+` or `-` to be turned into *ordered* lists. * Added to the list of block-level HTML tags: noscript, form, fieldset, iframe, math * Fixed an odd bug where, with input like this: > This line starts the blockquote * This list is part of the quote. * Second item. This paragraph is not part of the blockquote. The trailing paragraph was incorrectly included in the blockquote. (The solution was to add an extra "\n" after lists.) * The contents of `<pre>` tags inside `<blockquote>` are no longer indented in the HTML output. * PHP Markdown can now be used as a modifier by the Smarty templating engine. Rename the file to "modifier.markdown.php" and put it in your smarty plugins folder. * Now works as a bBlog formatter. Rename the file to "modifier.markdown.php" and place it in the "bBlog_plugins" folder. 1.0fc1: Wed 8 Jul 2004 * Greatly simplified the rules for code blocks. No more colons necessary; if it's indented (4 spaces or 1 tab), it's a code block. * Unordered list items can now be denoted by any of the following bullet markers: [*+-] * Replacing `"` with `&quot;` to fix literal quotes within title attributes. 1.0b9: Sun 27 Jun 2004 * Replacing `"` with `&quot;` to fix literal quotes within img alt attributes. 1.0b8: Wed 23 Jun 2004 * In WordPress, solved a bug where PHP Markdown did not deactivate the paragraph filter, converting all returns to a line break. The "texturize" filter was being disabled instead. * Added 'math' tags to block-level tag patterns in `_HashHTMLBlocks()`. Please disregard all the 'math'-tag related items in 1.0b7. * Commented out some vestigial code in `_EscapeSpecialChars()` 1.0b7: Sat 12 Jun 2004 * Added 'math' to `$tags_to_skip` pattern, for MathML users. * Tweaked regex for identifying HTML entities in `_EncodeAmpsAndAngles()`, so as to allow for the very long entity names used by MathML. (Thanks to Jacques Distler for the patch.) * Changed the internals of `_TokenizeHTML` to lower the PHP version requirement to PHP 4.0.5. 1.0b6: Sun 6 Jun 2004 * Added a WordPress plugin interface. This means that you can directly put the "markdown.php" file into the "wp-content/plugins" directory and then activate it from the administrative interface. * Added a Textile compatibility interface. Rename this file to "classTextile.php" and it can replace Textile anywhere. * The title attribute of reference-style links was ignored. This is now fixed. * Changed internal variable names so that they begin with `md_` instead of `g_`. 
This should reduce the risk of name collision with other programs. 1.0b5: Sun 2 May 2004 * Workaround for supporting `<ins>` and `<del>` as block-level tags. This only works if the start and end tags are on lines by themselves. * Three or more underscores can now be used for horizontal rules. * Lines containing only whitespace are trimmed from blockquotes. * You can now optionally wrap URLs with angle brackets -- like so: `<http://example.com>` -- in link definitions and inline links and images. * `_` and `*` characters in links and images are no longer escaped as HTML entities. Instead, we use the ridiculous but effective MD5 hashing trick that's used to hide these characters elsewhere. The end result is that the HTML output uses the literal `*` and `_` characters, rather than the ugly entities. * Passing an empty string to the Markdown function no longer creates an empty paragraph. * Added a global declaration at the beginning of the file. This means you can now `include 'markdown.php'` from inside a function. 1.0b4.1: Sun 4 Apr 2004 * Fixed a bug where image tags did not close. * Fixed a bug where brackets `[]` inside a link caused the link to be ignored. PHP Markdown supports only 6 (!) levels of brackets inside a link (while John's original version of Markdown in Perl supports many more). 1.0b4: Sat 27 Mar 2004 * First release of PHP Markdown, based on the 1.0b4 release. Author & Contributors --------------------- Original version by John Gruber PHP translation by Michel Fortin First WordPress plugin interface written by Matt Mullenweg Copyright and License --------------------- Copyright (c) 2004 Michel Fortin All rights reserved. Copyright (c) 2003-2004 John Gruber All rights reserved. Markdown is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. 
Markdown is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. */ ?>

'._RunSpanGamut(_UnslashQuotes('\\1')).'

`'._RunSpanGamut(_UnslashQuotes('\\1')).'`