lib/transform.php

   1 <?php rcs_id('$Id: transform.php,v 1.31 2001-12-18 18:47:29 dairiki Exp $');
   2 require_once('lib/WikiPlugin.php');
   3
   4 define('WT_SIMPLE_MARKUP', 0);
   5 define('WT_TOKENIZER', 1);
   6 define('WT_MODE_MARKUP', 2);
   7
   8 define("ZERO_LEVEL", 0);
   9 define("NESTED_LEVEL", 1);
  10
  11 class WikiTransform
  12 {
  13    // public variables (only meaningful during do_transform)
  14    var $linenumber;     // current linenumber
  15    var $replacements;   // storage for tokenized strings of current line
  16    var $user_data;      // can be used by the transformer functions
  17                         // to store miscellaneous data.
  18
  19    // private variables
  20    var $content;        // wiki markup, array of lines
  21    var $mode_set;       // stores if a HTML mode for this line has been set
  22    var $trfrm_func;     // array of registered functions
  23    var $stack;          // stack for SetHTMLMode (keeping track of open tags)
  24
  25    /** init function */
  26    function WikiTransform()
  27    {
  28       $this->trfrm_func = array();
  29       $this->stack = new Stack;
  30    }
  31
  32    /**
  33     * Register transformation functions
  34     *
  35     * This should be done *before* calling do_transform
  36     *
  37     * @param $type enum  <dl>
  38     * <dt>WT_MODE_MARKUP</dt>
  39     * <dd>If one WT_MODE_MARKUP really sets the html mode, then
  40     *     all successive WT_MODE_MARKUP functions are skipped.</dd>
  41     * <dt>WT_TOKENIZER</dt>
  42     * <dd> The transformer function is called once for each match
  43     *      of the $regexp in the line.  The matched values are tokenized
  44     *      to protect them from further transformation.</dd>
  45     *
  46     * @param $function string  Function name
  47     * @param $regexp string  Required for WT_TOKENIZER functions.
  48     * Optional for others. If given, the transformer function will only be
  49     * called if the line matches the $regexp.
  50     */
  51    function register($type, $function, $regexp = false)
  52    {
  53       $this->trfrm_func[] = array ($type, $function, $regexp);
  54    }
  55
  56    /**
  57     * Sets current mode like list, preformatted text, plain text
  58     *
  59     * Takes care of closing (open) tags
  60     *
  61     * This is a helper function used to keep track of what HTML
  62     * block-level element we are currently processing.
  63     * Block-level elements are things like paragraphs "<p>",
  64     * pre-formatted text "<pre>", and the various list elements:
  65     * "<ul>", "<ol>" and "<dl>".  Now, SetHTMLMode is also used to
  66     * keep track of "<li>" and "<dd>" elements. Note that some of these elements
  67     * can be nested, while others can not.  (In particular, according to
  68     * the HTML 4.01 specification,  a paragraph "<p>" element is not
  69     * allowed to contain any other block-level elements.  Also <pre>,
  70     * <li>,  <dt>, <dd>, <h1> ... have this same restriction.)
  71     *
  72     * SetHTMLMode generates whatever HTML is necessary to get us into
  73     * the requested element type at the requested nesting level.
  74     *
  75     * @param $tag string Type of HTML element to open.
  76     *
  77     * If $tag is an array, $tag[0] gives the element type,
  78     * and $tag[1] should be a hash containing attribute-value
  79     * pairs for the element.
  80     *
  81     * If $tag is the empty string, all open elements (down to the
  82     * level requested by $level) are closed.  Use
  83     * SetHTMLMode('',0) to close all open block-level elements.
  84     *
  85     * @param $level string  Rrequested nesting level for current element.
  86     * The nesting level for top level block is one (which is
  87     * the default).
  88     * Nesting is arbitrary limited to 20 levels.
  89     *
  90     * @return string Returns the HTML markup to open the specified element.
  91     */
  92    function SetHTMLMode($tag, $level = 1)
  93    {
  94       if (is_array($tag)) {
  95          $args = $tag[1];
  96          $tag = $tag[0];
  97       }
  98       else {
  99          $args = array();
 100       }
 101
 102       $this->mode_set = 1;      // in order to prevent other mode markup
 103                                 // to be executed
 104       $retvar = '';
 105
 106       if ($level > 20) {
 107          // arbitrarily limit tag nesting
 108          ExitWiki(gettext ("Lists nested too deep in SetHTMLOutputMode"));
 109       }
 110
 111       if ($level <= $this->stack->cnt()) {
 112          // $tag has fewer nestings (old: tabs) than stack,
 113          // reduce stack to that tab count
 114          while ($this->stack->cnt() > $level) {
 115             $closetag = $this->stack->pop();
 116             assert('$closetag != false');
 117             $retvar .= "</$closetag>\n";
 118          }
 119
 120          // if list type isn't the same,
 121          // back up one more and push new tag
 122          if ($tag && $tag != $this->stack->top()) {
 123             $closetag = $this->stack->pop();
 124             $retvar .= "</$closetag>" . StartTag($tag, $args) . "\n";
 125             $this->stack->push($tag);
 126          }
 127
 128       }
 129       else {// $level > $this->stack->cnt()
 130          // Test for and close top level elements which are not allowed to contain
 131          // other block-level elements.
 132          if ($this->stack->cnt() == 1 and
 133              preg_match('/^(p|pre|h\d)$/i', $this->stack->top()))
 134          {
 135             $closetag = $this->stack->pop();
 136             $retvar .= "</$closetag>";
 137          }
 138
 139          // we add the diff to the stack
 140          // stack might be zero
 141          if ($this->stack->cnt() < $level) {
 142             while ($this->stack->cnt() < $level - 1) {
 143                // This is a bit of a hack:
 144                //
 145                // We're not nested deep enough, and have to make up some kind of block
 146                // element to nest within.
 147                //
 148                // Currently, this can only happen for nested list element
 149                // (either <ul> <ol> or <dl>).  What we used to do here is
 150                // to open extra lists of whatever type was requested.
 151                // This would result in invalid HTML, since and list is
 152                // not allowed to contain another list without first containing
 153                // a list item.  ("<ul><ul><li>Item</ul></ul>" is invalid.)
 154                //
 155                // So now, when we need extra list elements, we use a <dl>, and
 156                // open it with an empty <dd>.
 157                $el =  $this->stack->cnt() % 2 == 0 ? 'dl' : 'dd';
 158                $retvar .= "<$el>";
 159                $this->stack->push($el);
 160             }
 161
 162             $retvar .= StartTag($tag, $args) . "\n";
 163             $this->stack->push($tag);
 164          }
 165       }
 166
 167       return $this->token($retvar);
 168    }
 169
 170    /**
 171     * Start new list item element.
 172     *
 173     * This closes any currently open list items at the specified level or deeper,
 174     * then opens a new list item element.
 175     *
 176     * @param $list_type string  Type of list element to open.  This should
 177     * be one of 'dl', 'ol', or 'ul'.
 178     *
 179     * @param $level integer  Nesting depth for list item.  Should be a positive integer.
 180     *
 181     * @param $defn_term string  Definition term.  Specifies the contents for the
 182     * &lt;dt&gt; element.  Only used if $list_type is 'dl'.
 183     *
 184     * @return string HTML
 185     */
 186    function ListItem($list_type, $level, $defn_term = '')
 187    {
 188        $level = min($level, 10);
 189
 190        $retval = $this->SetHTMLMode($list_type, 2 * $level - 1);
 191        if ($list_type == 'dl') {
 192            $retval .= Element('dt', $defn_term);
 193            $retval .= $this->SetHTMLMode('dd', 2 * $level);
 194        }
 195        else {
 196            $retval .= $this->SetHTMLMode('li', 2 * $level);
 197        }
 198        return $retval;
 199    }
 200
 201
 202    /** Work horse and main loop.
 203     *
 204     * This function does the transform from wiki markup to HTML.
 205     *
 206     * Contains main-loop and calls transformer functions.
 207     *
 208     * @param $html string  HTML header (if needed, otherwise '')
 209     * (This string is prepended to the return value.)
 210     *
 211     * @param $content array  Wiki markup as array of lines
 212     *
 213     * @return string HTML
 214     */
 215    function do_transform($html, $content)
 216    {
 217       global $FieldSeparator;
 218
 219       $this->content = $content;
 220       $this->replacements = array();
 221       $this->user_data = array();
 222
 223       // Loop over all lines of the page and apply transformation rules
 224       $numlines = count($this->content);
 225       for ($lnum = 0; $lnum < $numlines; $lnum++)
 226       {
 227
 228          $this->linenumber = $lnum;
 229          $line = $this->content[$lnum];
 230
 231          // blank lines clear the current mode (to force new paragraph)
 232          if (!strlen($line) || $line == "\r") {
 233             $html .= $this->SetHTMLMode('', 0);
 234             continue;
 235          }
 236
 237          $this->mode_set = 0;
 238
 239          // main loop applying all registered functions
 240          // tokenizers, markup, html mode, ...
 241          // functions are executed in order of registering
 242          for (reset($this->trfrm_func);
 243               list($flags, $func, $regexp) = current($this->trfrm_func);
 244               next($this->trfrm_func)) {
 245
 246             // if HTMLmode is already set then skip all following
 247             // WT_MODE_MARKUP functions
 248             if ($this->mode_set && ($flags & WT_MODE_MARKUP) != 0)
 249                continue;
 250
 251             if (!empty($regexp) && !preg_match("/$regexp/", $line))
 252                continue;
 253
 254             // call registered function
 255             if (($flags & WT_TOKENIZER) != 0)
 256                $line = $this->tokenize($line, $regexp, $func);
 257             else
 258                $line = $func($line, $this);
 259          }
 260
 261          $html .= $line . "\n";
 262       }
 263       // close all tags
 264       $html .= $this->SetHTMLMode('', 0);
 265
 266       return $this->untokenize($html);
 267    }
 268    // end do_transfrom()
 269
 270    // Register a new token.
 271    function token($repl) {
 272       global $FieldSeparator;
 273       $tok = $FieldSeparator . sizeof($this->replacements) . $FieldSeparator;
 274       $this->replacements[] = $repl;
 275       return $tok;
 276    }
 277
 278    // helper function which does actual tokenizing
 279    function tokenize($str, $pattern, $func) {
 280       // Find any strings in $str that match $pattern and
 281       // store them in $orig, replacing them with tokens
 282       // starting at number $ntokens - returns tokenized string
 283       $new = '';
 284       while (preg_match("/^(.*?)($pattern)/", $str, $matches)) {
 285          $str = substr($str, strlen($matches[0]));
 286          $new .= $matches[1] . $this->token($func($matches[2], $this));
 287       }
 288       return $new . $str;
 289    }
 290
 291    function untokenize($line) {
 292       global $FieldSeparator;
 293
 294       $chunks = explode ($FieldSeparator, "$line ");
 295       $line = $chunks[0];
 296       for ($i = 1; $i < count($chunks); $i += 2)
 297       {
 298          $tok = $chunks[$i];
 299          $line .= $this->replacements[$tok] . $chunks[$i + 1];
 300       }
 301       return $line;
 302    }
 303 }
 304 // end class WikiTransform
 305
 306
 307 //////////////////////////////////////////////////////////
 308
 309 class WikiPageTransform
 310 extends WikiTransform {
 311     function WikiPageTransform() {
 312         global $WikiNameRegexp, $AllowedProtocols, $InterWikiLinkRegexp;
 313
 314         $this->WikiTransform();
 315
 316         // register functions
 317         // functions are applied in order of registering
 318
 319         $this->register(WT_SIMPLE_MARKUP, 'wtm_plugin_link');
 320         $this->register(WT_MODE_MARKUP, 'wtm_plugin');
 321
 322         $this->register(WT_TOKENIZER, 'wtt_doublebrackets', '\[\[');
 323         $this->register(WT_TOKENIZER, 'wtt_footnotes', '^\[\d+\]');
 324         $this->register(WT_TOKENIZER, 'wtt_footnoterefs', '\[\d+\]');
 325         $this->register(WT_TOKENIZER, 'wtt_bracketlinks', '\[.+?\]');
 326         $this->register(WT_TOKENIZER, 'wtt_urls',
 327                         "!?\b($AllowedProtocols):[^\s<>\[\]\"'()]*[^\s<>\[\]\"'(),.?]");
 328
 329         if (function_exists('wtt_interwikilinks')) {
 330             $this->register(WT_TOKENIZER, 'wtt_interwikilinks',
 331                             pcre_fix_posix_classes("!?(?<![[:alnum:]])") .
 332                             "$InterWikiLinkRegexp:[^\\s.,;?()]+");
 333         }
 334         $this->register(WT_TOKENIZER, 'wtt_bumpylinks', "!?$WikiNameRegexp");
 335
 336         if (function_exists('wtm_table')) {
 337             $this->register(WT_MODE_MARKUP, 'wtm_table', '^\|');
 338         }
 339         $this->register(WT_SIMPLE_MARKUP, 'wtm_htmlchars');
 340         $this->register(WT_SIMPLE_MARKUP, 'wtm_linebreak');
 341         $this->register(WT_SIMPLE_MARKUP, 'wtm_bold_italics');
 342
 343         $this->register(WT_MODE_MARKUP, 'wtm_list_ul');
 344         $this->register(WT_MODE_MARKUP, 'wtm_list_ol');
 345         $this->register(WT_MODE_MARKUP, 'wtm_list_dl');
 346         $this->register(WT_MODE_MARKUP, 'wtm_preformatted');
 347         $this->register(WT_MODE_MARKUP, 'wtm_headings');
 348         $this->register(WT_MODE_MARKUP, 'wtm_hr');
 349         $this->register(WT_MODE_MARKUP, 'wtm_paragraph');
 350     }
 351 };
 352
 353 function do_transform ($lines, $class = 'WikiPageTransform') {
 354     if (is_string($lines))
 355         $lines = preg_split('/[ \t\r]*\n/', trim($lines));
 356
 357     $trfm = new $class;
 358     return $trfm->do_transform('', $lines);
 359 }
 360
 361 class LinkTransform
 362 extends WikiTransform {
 363     function LinkTransform() {
 364         global $WikiNameRegexp, $AllowedProtocols, $InterWikiLinkRegexp;
 365
 366         $this->WikiTransform();
 367
 368         // register functions
 369         // functions are applied in order of registering
 370
 371         $this->register(WT_TOKENIZER, 'wtt_doublebrackets', '\[\[');
 372         $this->register(WT_TOKENIZER, 'wtt_quotetoken', '\[\d+\]');
 373         $this->register(WT_TOKENIZER, 'wtt_bracketlinks', '\[.+?\]');
 374         $this->register(WT_TOKENIZER, 'wtt_urls',
 375                         "!?\b($AllowedProtocols):[^\s<>\[\]\"'()]*[^\s<>\[\]\"'(),.?]");
 376
 377         if (function_exists('wtt_interwikilinks')) {
 378             $this->register(WT_TOKENIZER, 'wtt_interwikilinks',
 379                             pcre_fix_posix_classes("!?(?<![[:alnum:]])") .
 380                             "$InterWikiLinkRegexp:[^\\s.,;?()]+");
 381         }
 382         $this->register(WT_TOKENIZER, 'wtt_bumpylinks', "!?$WikiNameRegexp");
 383         $this->register(WT_SIMPLE_MARKUP, 'wtm_htmlchars');
 384     }
 385 };
 386
/*
Requirements for functions registered to WikiTransform:

Markup functions (WT_SIMPLE_MARKUP and WT_MODE_MARKUP)

Signature:  function wtm_xxxx($line, &$transform)

$line ... current line containing wiki markup
        (Note: it may already contain HTML from other transform functions)
&$transform ... WikiTransform object -- for the public variables of this
        object and their use, see above.

Functions have to return $line (it doesn't matter whether it was modified
or not). All conversion should take place inside $line.

Tokenizer functions (WT_TOKENIZER)

Signature:  function wtt_xxxx($match, &$transform)

$match ... the part of the current line which matched the regexp the
        function was registered with

Tokenizer functions are called once for each match and have to return the
replacement string for $match. WikiTransform::tokenize() stores that
string in $transform->replacements and puts a token in its place.
Back substitution of tokenized strings is done by do_transform().
*/
 405
 406
 407
 408    //////////////////////////////////////////////////////////
 409    // Tokenizer functions
 410
 411
 412 function  wtt_doublebrackets($match, &$trfrm)
 413 {
 414    return '[';
 415 }
 416
 417 function wtt_footnotes($match, &$trfrm)
 418 {
 419    // FIXME: should this set HTML mode?
 420    $ftnt = trim(substr($match,1,-1)) + 0;
 421    $fntext = "[$ftnt]";
 422    $html = Element('br');
 423
 424    $fnlist = $trfrm->user_data['footnotes'][$ftnt];
 425    if (!is_array($fnlist))
 426       return $html . $fntext;
 427
 428    $trfrm->user_data['footnotes'][$ftnt] = 'footnote_seen';
 429
 430    while (list($k, $anchor) = each($fnlist))
 431    {
 432       $html .=  Element("a", array("name" => "footnote-$ftnt",
 433                                    "href" => "#$anchor",
 434                                    "class" => "footnote-rev"),
 435                         $fntext);
 436       $fntext = '+';
 437    }
 438    return $html;
 439 }
 440
 441 function wtt_footnoterefs($match, &$trfrm)
 442 {
 443    $ftnt = trim(substr($match,1,-1)) + 0;
 444
 445    $footnote_definition_seen = false;
 446
 447    if (empty($trfrm->user_data['footnotes']))
 448       $trfrm->user_data['footnotes'] = array();
 449    if (empty($trfrm->user_data['footnotes'][$ftnt]))
 450       $trfrm->user_data['footnotes'][$ftnt] = array();
 451    else if (!is_array($trfrm->user_data['footnotes'][$ftnt]))
 452       $footnote_definition_seen = true;
 453
 454
 455    $args['href'] = "#footnote-$ftnt";
 456    if (!$footnote_definition_seen)
 457    {
 458       $args['name'] = "footrev-$ftnt-" .
 459           count($trfrm->user_data['footnotes'][$ftnt]);
 460       $trfrm->user_data['footnotes'][$ftnt][] = $args['name'];
 461    }
 462
 463    return Element('sup', array('class' => 'footnote'),
 464                   QElement("a", $args, "[$ftnt]"));
 465 }
 466
 467 function wtt_bracketlinks($match, &$trfrm)
 468 {
 469     if (preg_match('/^\[\s*\]$/', $match)) {
 470         return htmlspecialchars($match);
 471     }
 472
 473     $link = ParseAndLink($match);
 474     if (strstr($link['link'], "</form>")) {
 475         // FIXME: BIG HACK: see note in wtm_plugin.
 476         return "</p>" . $link['link'] . "<p>";
 477     }
 478     return $link["link"];
 479 }
 480
 481
 482
 483 // replace all URL's with tokens, so we don't confuse them
 484 // with Wiki words later. Wiki words in URL's break things.
 485 // URLs preceeded by a '!' are not linked
 486 function wtt_urls($match, &$trfrm)
 487 {
 488    if ($match[0] == "!")
 489       return htmlspecialchars(substr($match,1));
 490    return LinkURL($match);
 491 }
 492
 493 // Link Wiki words (BumpyText)
 494 // Wikiwords preceeded by a '!' are not linked
 495 function wtt_bumpylinks($match, &$trfrm)
 496 {
 497    global $dbi;
 498    if ($match[0] == "!")
 499       return htmlspecialchars(substr($match,1));
 500    return LinkWikiWord($match);
 501 }
 502
 503
 504 // Just quote the token.
 505 function wtt_quotetoken($match, &$trfrm)
 506 {
 507     return htmlspecialchars($match);
 508 }
 509
 510
 511
 512 // end of tokenizer functions
 513 //////////////////////////////////////////////////////////
 514
 515
 516    //////////////////////////////////////////////////////////
 517    // basic simple markup functions
 518
 519    // escape HTML metachars
 520    function wtm_htmlchars($line, &$transformer)
 521    {
 522       $line = str_replace('&', '&amp;', $line);
 523       $line = str_replace('>', '&gt;', $line);
 524       $line = str_replace('<', '&lt;', $line);
 525       return($line);
 526    }
 527
 528
 529    // %%% are linebreaks
 530    function wtm_linebreak($line, &$transformer) {
 531       return str_replace('%%%', Element('br'), $line);
 532    }
 533
 534    // bold and italics
 535    function wtm_bold_italics($line, &$transformer) {
 536       $line = preg_replace('|(__)(.*?)(__)|', '<strong>\2</strong>', $line);
 537       $line = preg_replace("|('')(.*?)('')|", '<em>\2</em>', $line);
 538       return $line;
 539    }
 540
 541
 542
 543    //////////////////////////////////////////////////////////
 544    // some tokens to be replaced by (dynamic) content
 545
 546 // FIXME: some plugins are in-line (maybe?) and some are block level.
 547 // Here we treat them all as inline, which will probably
 548 // generate some minorly invalid HTML in some cases.
 549 //
 550 function wtm_plugin_link($line, &$transformer) {
 551     // FIXME: is this good syntax?
 552     global $dbi, $request;      // FIXME: make these non-global?
 553
 554     if (preg_match('/^(.*?)(<\?plugin-link\s+.*?\?>)(.*)$/', $line, $m)) {
 555         list(, $prematch, $plugin_pi, $postmatch) = $m;
 556         $loader = new WikiPluginLoader;
 557         $html = $loader->expandPI($plugin_pi, $dbi, $request);
 558         $line = $prematch . $transformer->token($html) . $postmatch;
 559     }
 560     return $line;
 561 }
 562
 563 function wtm_plugin($line, &$transformer) {
 564     // FIXME: is this good syntax?
 565     global $dbi, $request;      // FIXME: make these non-global?
 566
 567     if (preg_match('/^<\?plugin(-form)?\s.*\?>\s*$/', $line)) {
 568         $loader = new WikiPluginLoader;
 569         $html = $loader->expandPI($line, $dbi, $request);
 570         $line = $transformer->SetHTMLMode('', 0) . $transformer->token($html);
 571     }
 572     return $line;
 573 }
 574
 575
 576    //////////////////////////////////////////////////////////
 577    // mode markup functions
 578
 579
 580    // tabless markup for unordered, ordered, and dictionary lists
 581    // ul/ol list types can be mixed, so we only look at the last
 582    // character. Changes e.g. from "**#*" to "###*" go unnoticed.
 583    // and wouldn't make a difference to the HTML layout anyway.
 584
 585    // unordered lists <UL>: "*"
 586    // has to be registereed before list OL
 587    function wtm_list_ul($line, &$trfrm) {
 588       if (preg_match("/^([#*;]*\*)[^#]/", $line, $matches)) {
 589          $numtabs = strlen($matches[1]);
 590          $line = preg_replace("/^([#*]*\*)/", '', $line);
 591          $line = $trfrm->ListItem('ul', $numtabs) . $line;
 592       }
 593       return $line;
 594    }
 595
 596    // ordered lists <OL>: "#"
 597    function wtm_list_ol($line, &$trfrm) {
 598       if (preg_match("/^([#*;]*\#)/", $line, $matches)) {
 599          $numtabs = strlen($matches[1]);
 600          $line = preg_replace("/^([#*]*\#)/", "", $line);
 601          $line = $trfrm->ListItem('ol', $numtabs) . $line;
 602       }
 603       return $line;
 604    }
 605
 606
 607    // definition lists <DL>: ";text:text"
 608    function wtm_list_dl($line, &$trfrm) {
 609       if (preg_match("/^([#*;]*;)(.*?):(.*$)/", $line, $matches)) {
 610          $numtabs = strlen($matches[1]);
 611          $line = $trfrm->ListItem('dl', $numtabs, $matches[2]) . $matches[3];
 612       }
 613       return $line;
 614    }
 615
 616    // mode: preformatted text, i.e. <pre>
 617    function wtm_preformatted($line, &$trfrm) {
 618       if (preg_match("/^\s+/", $line)) {
 619          $line = $trfrm->SetHTMLMode('pre') . $line;
 620       }
 621       return $line;
 622    }
 623
 624    // mode: headings, i.e. <h1>, <h2>, <h3>
 625    // lines starting with !,!!,!!! are headings
 626    // Patch from steph/tara <tellme@climbtothestars.org>:
 627    //    use <h2>, <h3>, <h4> since <h1> is page title.
 628    function wtm_headings($line, &$trfrm) {
 629       if (preg_match("/^(!{1,3})[^!]/", $line, $whichheading)) {
 630          if($whichheading[1] == '!') $heading = 'h4';
 631          elseif($whichheading[1] == '!!') $heading = 'h3';
 632          elseif($whichheading[1] == '!!!') $heading = 'h2';
 633          $line = preg_replace("/^!+/", '', $line);
 634          $line = $trfrm->SetHTMLMode($heading) . $line;
 635       }
 636       return $line;
 637    }
 638
 639 // markup for tables
 640 function wtm_table($line, &$trfrm)
 641 {
 642    $row = '';
 643    while (preg_match('/^(\|+)(v*)([<>^]?)([^|]*)/', $line, $m))
 644    {
 645       $line = substr($line, strlen($m[0]));
 646       $td = array();
 647
 648       if (strlen($m[1]) > 1)
 649          $td['colspan'] = strlen($m[1]);
 650       if (strlen($m[2]) > 0)
 651          $td['rowspan'] = strlen($m[2]) + 1;
 652
 653       if ($m[3] == '^')
 654          $td['align'] = 'center';
 655       else if ($m[3] == '>')
 656          $td['align'] = 'right';
 657       else
 658          $td['align'] = 'left';
 659
 660       $row .= $trfrm->token(StartTag('td', $td) . "&nbsp;");
 661       $row .= trim($m[4]);
 662       $row .= $trfrm->token("&nbsp;</td>");
 663    }
 664    assert(empty($line));
 665    $row = $trfrm->token("<tr>") . $row . $trfrm->token("</tr>");
 666
 667    return $trfrm->SetHTMLMode(array('table',
 668                                     array(//'align' => 'left',
 669                                           'cellpadding' => 1,
 670                                           'cellspacing' => 1,
 671                                           'border' => 1))) .
 672       $row;
 673 }
 674
 675    // four or more dashes to <hr>
 676    // Note this is of type WT_MODE_MARKUP becuase <hr>'s aren't
 677    // allowed within <p>'s. (e.g. "<p><hr></p>" is not valid HTML.)
 678    function wtm_hr($line, &$trfrm) {
 679       if (preg_match('/^-{4,}(.*)$/', $line, $m)) {
 680          $line = $trfrm->SetHTMLMode('', 0) . Element('hr');
 681          if ($m[1])
 682             $line .= $trfrm->SetHTMLMode('p') . $m[1];
 683       }
 684       return $line;
 685    }
 686
 687    // default mode: simple text paragraph
 688    function wtm_paragraph($line, &$trfrm) {
 689       $line = $trfrm->SetHTMLMode('p') . $line;
 690       return $line;
 691    }
 692
 693 // (c-file-style: "gnu")
 694 // Local Variables:
 695 // mode: php
 696 // tab-width: 8
 697 // c-basic-offset: 4
 698 // c-hanging-comment-ender-p: nil
 699 // indent-tabs-mode: nil
 700 // End:
 701 ?>