3 * Copyright 1999-2008 $ThePhpWikiProgrammingTeam
4 * Copyright 2008-2009 Marc-Etienne Vargenau, Alcatel-Lucent
6 * This file is part of PhpWiki.
8 * PhpWiki is free software; you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation; either version 2 of the License, or
11 * (at your option) any later version.
13 * PhpWiki is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
18 * You should have received a copy of the GNU General Public License along
19 * with PhpWiki; if not, write to the Free Software Foundation, Inc.,
20 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
24 Standard functions for Wiki functionality
25 WikiURL ($pagename, $args, $get_abs_url)
27 IconForLink ($protocol_or_url)
28 PossiblyGlueIconToText($proto_or_url, $text)
30 LinkURL ($url, $linktext)
31 LinkImage ($url, $alt)
32 ImgObject ($img, $url)
34 SplitQueryArgs ($query_args)
35 LinkPhpwikiURL ($url, $text, $basepage)
36 MangleXmlIdentifier($str)
38 class Stack { push($item), pop(), cnt(), top() }
39 class Alert { show() }
40 class WikiPageName {getParent(),isValid(),getWarnings() }
42 expand_tabs($str, $tab_width = 8)
44 NoSuchRevision ($request, $page, $version)
45 TimezoneOffset ($time, $no_colon)
46 Iso8601DateTime ($time)
47 Rfc2822DateTime ($time)
48 ParseRfc1123DateTime ($timestr)
50 ByteFormatter ($bytes = 0, $longformat = false)
53 __vsprintf ($fmt, $args)
55 file_mtime ($filename)
56 sort_file_mtime ($a, $b)
57 class fileSet {fileSet($directory, $filepattern = false),
58 getFiles($exclude='', $sortby='', $limit='') }
59 class ListRegexExpand { listMatchCallback($item, $key),
60 expandRegex ($index, &$pages) }
63 glob_match ($glob, $against, $case_sensitive = true)
64 explodeList ($input, $allnames, $glob_style = true, $case_sensitive = true)
65 explodePageList ($input, $perm = false)
67 can ($object, $method)
68 function_usable ($function_name)
72 subPageSlice ($pagename, $pos)
73 isActionPage ($filename)
77 obj2hash ($obj, $exclude = false, $fields = false)
80 url_get_contents ($uri)
82 firstNWordsOfContent ($n, $content)
83 extractSection ($section, $content, $page, $quiet = false, $sectionhead = false)
86 string_starts_with($string, $prefix)
87 string_ends_with($string, $suffix)
88 array_remove($arr,$value)
89 longer_timeout($secs=30)
92 binary_search($needle, $haystack)
94 javascript_quote_string($s)
97 parse_attributes($line)
101 function: linkExistingWikiWord($wikiword, $linktext, $version)
102 moved to: lib/WikiTheme.php
104 if (defined('_PHPWIKI_STDLIB_LOADED')) return;
105 else define('_PHPWIKI_STDLIB_LOADED', true);
107 if (!defined('MAX_PAGENAME_LENGTH')) {
108 define('MAX_PAGENAME_LENGTH', 100);
/**
 * Convert string to a valid XML identifier.
 *
 * XML 1.0 identifiers are of the form: [A-Za-z][A-Za-z0-9:_.-]*
 *
 * We would like to have, e.g. named anchors within wiki pages
 * with names like "Table of Contents" --- clearly not a valid XML
 * fragment identifier.
 *
 * This function implements a one-to-one map from {any string}
 * to {valid XML identifiers}.
 *
 * It does this by
 * converting all bytes not in [A-Za-z0-9:_-],
 * and any leading byte not in [A-Za-z] to '.bb',
 * where 'bb' is the hexadecimal representation of the
 * byte.
 *
 * As a special case, the empty string is converted to 'empty.'
 *
 * @param string $str Arbitrary text (e.g. a section title).
 * @return string A valid XML identifier.
 */
function MangleXmlIdentifier($str)
{
    $str = (string)$str;
    // Only the genuinely empty string gets the special value; "0" must be
    // mangled like any other string to keep the mapping one-to-one.
    if ($str === '') {
        return 'empty.';
    }

    return preg_replace_callback(
        '/[^-_:A-Za-z0-9]|(?<=^)[^A-Za-z]/',
        function ($m) {
            // $m[0] is the single byte that is not allowed at this position.
            // (Using the literal '$m' here would always yield '.24'.)
            return '.' . sprintf('%02x', ord($m[0]));
        },
        $str
    );
}
/**
 * Build the name of the WIKI_ID cookie for this wiki.
 *
 * The name is derived from WIKI_NAME, so it is only unique on the host
 * if a unique WIKI_NAME has been set in the configuration file.
 *
 * @return string The name of the WIKI_ID cookie to use for this wiki.
 */
function getCookieName()
{
    // Every character that is neither a digit nor a word character becomes "_".
    $prefix = preg_replace("/[^\d\w]/", "_", WIKI_NAME);

    return $prefix . "_WIKI_ID";
}
159 * Generates a valid URL for a given Wiki pagename.
160 * @param mixed $pagename If a string this will be the name of the Wiki page to link to.
161 * If a WikiDB_Page object function will extract the name to link to.
162 * If a WikiDB_PageRevision object function will extract the name to link to.
164 * @param bool $get_abs_url Default value is false.
165 * @return string The absolute URL to the page passed as $pagename.
167 function WikiURL($pagename, $args = array(), $get_abs_url = false)
169 global $request, $WikiTheme;
172 if (is_object($pagename)) {
173 if (isa($pagename, 'WikiDB_Page')) {
174 $pagename = $pagename->getName();
175 } elseif (isa($pagename, 'WikiDB_PageRevision')) {
176 $page = $pagename->getPage();
177 $args['version'] = $pagename->getVersion();
178 $pagename = $page->getName();
179 } elseif (isa($pagename, 'WikiPageName')) {
180 $anchor = $pagename->anchor;
181 $pagename = $pagename->name;
183 $anchor = $pagename->anchor;
184 $pagename = $pagename->name;
187 if (!$get_abs_url and DEBUG and $request->getArg('start_debug')) {
189 $args = 'start_debug=' . $request->getArg('start_debug');
190 elseif (is_array($args))
191 $args['start_debug'] = $request->getArg('start_debug'); else
192 $args .= '&start_debug=' . $request->getArg('start_debug');
194 if (is_array($args)) {
196 foreach ($args as $key => $val) {
197 // avoid default args
198 if (USE_PATH_INFO and $key == 'pagename')
200 elseif ($key == 'action' and $val == 'browse')
201 ; elseif (!is_array($val)) // ugly hack for getURLtoSelf() which also takes POST vars
202 $enc_args[] = urlencode($key) . '=' . urlencode($val);
204 $args = join('&', $enc_args);
207 if (USE_PATH_INFO or !empty($WikiTheme->HTML_DUMP_SUFFIX)) {
208 $url = $get_abs_url ? (SERVER_URL . VIRTUAL_PATH . "/") : "";
209 $base = preg_replace('/%2f/i', '/', rawurlencode($pagename));
211 if (!empty($WikiTheme->HTML_DUMP_SUFFIX)) {
212 if (!empty($WikiTheme->VALID_LINKS) and $request->getArg('action') == 'pdf') {
213 if (!in_array($pagename, $WikiTheme->VALID_LINKS))
216 $url = $base . $WikiTheme->HTML_DUMP_SUFFIX;
218 $url .= $WikiTheme->HTML_DUMP_SUFFIX;
227 $url = $get_abs_url ? SERVER_URL . SCRIPT_NAME : basename(SCRIPT_NAME);
228 $url .= "?pagename=" . rawurlencode($pagename);
233 $url .= "#" . MangleXmlIdentifier($anchor);
237 /** Convert relative URL to absolute URL.
239 * This converts a relative URL to one of PhpWiki's support files
240 * to an absolute one.
243 * @return string Absolute URL
245 function AbsoluteURL($url)
247 if (preg_match('/^https?:/', $url))
249 if ($url[0] != '/') {
250 $base = USE_PATH_INFO ? VIRTUAL_PATH : dirname(SCRIPT_NAME);
251 while ($base != '/' and substr($url, 0, 3) == "../") {
252 $url = substr($url, 3);
253 $base = dirname($base);
259 return SERVER_URL . $url;
262 function DataURL($url)
264 if (preg_match('/^https?:/', $url))
266 $url = NormalizeWebFileName($url);
267 if (DEBUG and $GLOBALS['request']->getArg('start_debug') and substr($url, -4, 4) == '.php')
268 $url .= "?start_debug=1"; // XMLRPC and SOAP debugging helper.
269 return AbsoluteURL($url);
273 * Generates icon in front of links.
275 * @param string $protocol_or_url URL or protocol to determine which icon to use.
277 * @return HtmlElement HtmlElement object that contains data to create img link to
278 * icon for use with url or protocol passed to the function. False if no img to be
281 function IconForLink($protocol_or_url)
285 if (0 and $filename_suffix == false) {
286 // display apache style icon for file type instead of protocol icon
287 // - archive: unix:gz,bz2,tgz,tar,z; mac:dmg,dmgz,bin,img,cpt,sit; pc:zip;
288 // - document: html, htm, text, txt, rtf, pdf, doc
289 // - non-inlined image: jpg,jpeg,png,gif,tiff,tif,swf,pict,psd,eps,ps
290 // - audio: mp3,mp2,aiff,aif,au
291 // - multimedia: mpeg,mpg,mov,qt
294 list ($proto) = explode(':', $protocol_or_url, 2);
295 $src = $WikiTheme->getLinkIconURL($proto);
297 return HTML::img(array('src' => $src, 'alt' => "", 'class' => 'linkicon'));
304 * Glue icon in front of or after text.
305 * Pref: 'noLinkIcons' - ignore icon if set
306 * WikiTheme: 'LinkIcons' - 'yes' at front
307 * - 'no' display no icon
308 * - 'front' display at left
309 * - 'after' display at right
311 * @param string $proto_or_url Protocol or URL. Used to determine the
313 * @param string $text The text.
314 * @return XmlContent.
316 function PossiblyGlueIconToText($proto_or_url, $text)
318 global $request, $WikiTheme;
319 if ($request->getPref('noLinkIcons'))
321 $icon = IconForLink($proto_or_url);
324 if ($where = $WikiTheme->getLinkIconAttr()) {
325 if ($where == 'no') return $text;
326 if ($where != 'after') $where = 'front';
330 if ($where == 'after') {
331 // span the icon only to the last word (tie them together),
332 // to let the previous words wrap on line breaks.
333 if (!is_object($text)) {
334 preg_match('/^(\s*\S*)(\s*)$/', $text, $m);
335 list (, $prefix, $last_word) = $m;
340 $text = HTML::span(array('style' => 'white-space: nowrap'),
341 $last_word, HTML::Raw(' '), $icon);
343 $text = HTML($prefix, $text);
346 // span the icon only to the first word (tie them together),
347 // to let the next words wrap on line breaks
348 if (!is_object($text)) {
349 preg_match('/^\s*(\S*)(.*?)\s*$/', $text, $m);
350 list (, $first_word, $tail) = $m;
355 $text = HTML::span(array('style' => 'white-space: nowrap'),
358 $text = HTML($text, $tail);
/**
 * Determines if the url passed to function is safe, by detecting if the characters
 * '<', '>', or '"' are present.
 * Their urlencoded forms (%3C, %3E, %22) are rejected as well. Percent-encoded
 * hex digits may be written in either case, so the match is case-insensitive.
 *
 * @param string $url URL to check for unsafe characters.
 * @return boolean True if safe, false otherwise.
 */
function IsSafeURL($url)
{
    return !preg_match('/[<>"]|%3C|%3E|%22/i', $url);
}
376 * Generates an HtmlElement object to store data for a link.
378 * @param string $url URL that the link will point to.
379 * @param string $linktext Text to be displayed as link.
380 * @return HtmlElement HtmlElement object that contains data to construct an html link.
382 function LinkURL($url, $linktext = '')
384 // FIXME: Is this needed (or sufficient?)
385 if (!IsSafeURL($url)) {
386 $link = HTML::span(array('class' => 'error'), _('Bad URL -- remove all of <, >, "'));
390 $linktext = preg_replace("/mailto:/A", "", $url);
391 $args = array('href' => $url);
392 if (defined('EXTERNAL_LINK_TARGET')) // can also be set in the css
393 $args['target'] = (is_string(EXTERNAL_LINK_TARGET) and (EXTERNAL_LINK_TARGET != "")) ? EXTERNAL_LINK_TARGET : "_blank";
394 $link = HTML::a($args, PossiblyGlueIconToText($url, $linktext));
396 $link->setAttr('class', $linktext ? 'namedurl' : 'rawurl');
403 * Syntax: [image.png size=50% border=n align= hspace= vspace= width= height=]
404 * Disallows sizes which are too small.
405 * Spammers may use such (typically invisible) image attributes to raise their GoogleRank.
407 * Handle embeddable objects, like svg, class, vrml, swf, svgz, pdf, avi, wmv especially.
409 function LinkImage($url, $alt = "")
411 $force_img = "png|jpg|gif|jpeg|bmp|pl|cgi";
412 // Disallow tags in img src urls. Typical CSS attacks.
413 // FIXME: Is this needed (or sufficient?)
414 // FIXED: This was broken for moniker:TP30 test/image.png => url="moniker:TP30" attr="test/image.png"
416 // support new syntax: [prefix/image.jpg size=50% border=n]
421 $arr = explode(' ', $url);
422 if (!empty($arr)) $url = $arr[0];
423 if (!IsSafeURL($url)) {
424 $link = HTML::span(array('class' => 'error'), _('Bad URL for image -- remove all of <, >, "'));
427 // spaces in inline images must be %20 encoded!
428 $link = HTML::img(array('src' => $url));
430 // Extract attributes
431 $arr = parse_attributes(strstr($ori_url, " "));
432 foreach ($arr as $attr => $value) {
433 // These attributes take strings: lang, id, title, alt
434 if (($attr == "lang")
436 || ($attr == "title")
439 $link->setAttr($attr, $value);
440 } // align = bottom|middle|top|left|right
441 // we allow "center" as synonym for "middle"
442 elseif (($attr == "align")
443 && (($value == "bottom")
444 || ($value == "middle")
445 || ($value == "center")
447 || ($value == "left")
448 || ($value == "right"))
450 if ($value == "center") {
453 $link->setAttr($attr, $value);
454 } // These attributes take a number (pixels): border, hspace, vspace
455 elseif ((($attr == "border") || ($attr == "hspace") || ($attr == "vspace"))
456 && (is_numeric($value))
458 $link->setAttr($attr, (int)$value);
459 } // These attributes take a number (pixels) or a percentage: height, width
460 elseif ((($attr == "height") || ($attr == "width"))
461 && (preg_match('/\d+[%p]?x?/', $value))
463 $link->setAttr($attr, $value);
464 } // We allow size=50% and size=20x30
465 // We replace this with "width" and "height" HTML attributes
466 elseif ($attr == "size") {
467 if (preg_match('/(\d+%)/', $value, $m)) {
468 $link->setAttr('width', $m[1]);
469 $link->setAttr('height', $m[1]);
470 } elseif (preg_match('/(\d+)x(\d+)/', $value, $m)) {
471 $link->setAttr('width', $m[1]);
472 $link->setAttr('height', $m[2]);
475 $url = substr(strrchr($ori_url, "/"), 1);
476 $link = HTML::span(array('class' => 'error'),
477 sprintf(_("Invalid attribute %s=%s for image %s"),
478 $attr, $value, $url));
482 // Correct silently the most common error
483 if ($url != $ori_url and empty($arr) and !preg_match("/^http/", $url)) {
484 // space belongs to the path
485 $file = NormalizeLocalFileName($ori_url);
486 if (file_exists($file)) {
487 $link = HTML::img(array('src' => $ori_url));
489 sprintf(_("Invalid image link fixed %s => %s. Spaces must be quoted with %%20."),
490 $url, $ori_url), E_USER_WARNING);
491 } elseif (string_starts_with($ori_url, getUploadDataPath())) {
492 $file = substr($file, strlen(getUploadDataPath()));
493 $path = getUploadFilePath() . $file;
494 if (file_exists($path)) {
495 trigger_error(sprintf(_("Invalid image link fixed \"%s\" => \"%s\".\n Spaces must be quoted with %%20."),
496 $url, $ori_url), E_USER_WARNING);
497 $link->setAttr('src', getUploadDataPath() . $file);
502 if (!$link->getAttr('alt')) {
503 $link->setAttr('alt', $alt);
505 // Check width and height as spam countermeasure
506 if (($width = $link->getAttr('width')) and ($height = $link->getAttr('height'))) {
507 //$width = (int) $width; // px or % or other suffix
508 //$height = (int) $height;
509 if (($width < 3 and $height < 10) or
510 ($height < 3 and $width < 20) or
511 ($height < 7 and $width < 7)
513 $link = HTML::span(array('class' => 'error'),
514 _("Invalid image size"));
519 // Prepare for getimagesize($url)
520 // $url only valid for external urls, otherwise local path
521 if (DISABLE_GETIMAGESIZE)
523 elseif (!preg_match("/\.$force_img$/i", $url))
524 ; // only valid image extensions or scripts assumed to generate images
525 elseif (preg_match("/^http/", $url)) { // external url
526 $size = @getimagesize($url);
527 } else { // local file
528 if (file_exists($file = NormalizeLocalFileName($url))) { // here
529 $size = @getimagesize($file);
530 } elseif (file_exists(NormalizeLocalFileName(urldecode($url)))) {
531 $size = @getimagesize($file);
532 $link->setAttr('src', rawurldecode($url));
533 } elseif (string_starts_with($url, getUploadDataPath())) { // there
534 $file = substr($file, strlen(getUploadDataPath()));
535 $path = getUploadFilePath() . rawurldecode($file);
536 $size = @getimagesize($path);
537 $link->setAttr('src', getUploadDataPath() . rawurldecode($file));
538 } else { // elsewhere
540 $size = @getimagesize($request->get('DOCUMENT_ROOT') . urldecode($url));
546 if (($width < 3 and $height < 10)
547 or ($height < 3 and $width < 20)
548 or ($height < 7 and $width < 7)
550 $link = HTML::span(array('class' => 'error'),
551 _("Invalid image size"));
556 $link->setAttr('class', 'inlineimage');
558 /* Check for inlined objects. Everything allowed in INLINE_IMAGES besides
559 * png|jpg|gif|jpeg|bmp|pl|cgi. If no image it is an object to embed.
560 * Note: Allow cgi's (pl,cgi) returning images.
562 if (!preg_match("/\.(" . $force_img . ")/i", $ori_url)) {
563 // HTML::img(array('src' => $url, 'alt' => $alt, 'title' => $alt));
564 // => HTML::object(array('src' => $url)) ...;
565 return ImgObject($link, $ori_url);
571 * <object> / <embed> tags instead of <img> for all non-image extensions
573 * Called by LinkImage(), not directly.
574 * Syntax: [image.svg size=50% alt=image.gif border=n align= hspace= vspace= width= height=]
575 * Samples: [Upload:song.mp3 type=audio/mpeg width=200 height=10]
576 * $alt may be an alternate img
577 * TODO: Need to unify with WikiPluginCached::embedObject()
579 * Note that Safari 1.0 will crash with <object>, so use only <embed>
580 * http://www.alleged.org.uk/pdc/2002/svg-object.html
582 * Allowed object tags:
584 * DATA=URI (object data)
585 * CLASSID=URI (location of implementation)
586 * ARCHIVE=CDATA (archive files)
587 * CODEBASE=URI (base URI for CLASSID, DATA, ARCHIVE)
588 * WIDTH=Length (object width)
589 * HEIGHT=Length (object height)
590 * NAME=CDATA (name for form submission)
591 * USEMAP=URI (client-side image map)
592 * TYPE=ContentType (content-type of object)
593 * CODETYPE=ContentType (content-type of code)
594 * STANDBY=Text (message to show while loading)
595 * TABINDEX=NUMBER (position in tabbing order)
596 * DECLARE (do not instantiate object)
597 * The rest is added as <param name="" value="" /> tags
599 function ImgObject($img, $url)
601 // get the url args: data="sample.svgz" type="image/svg+xml" width="400" height="300"
602 $params = explode(",", "id,width,height,data,classid,archive,codebase,name,usemap,type," .
603 "codetype,standby,tabindex,declare");
604 if (is_array($url)) {
607 foreach ($args as $attr => $value) {
608 foreach ($params as $param) {
609 if ($param == $attr) {
610 $img->setAttr($param, $value);
611 if (isset($found[$param])) $found[$param]++;
612 else $found[$param] = 1;
617 // now all remaining args are added as <param> to the object
619 foreach ($args as $attr => $value) {
620 if (!isset($found[$attr])) {
621 $params[] = HTML::param(array('name' => $attr,
625 $url = $img->getAttr('src');
626 $force_img = "png|jpg|gif|jpeg|bmp";
627 if (!preg_match("/\.(" . $force_img . ")/i", $url)) {
628 $img->setAttr('src', false);
631 $args = explode(' ', $url);
632 if (count($args) >= 1) {
633 $url = array_shift($args);
635 foreach ($args as $attr) {
636 foreach ($params as $param) {
637 if (preg_match("/^$param=(\S+)$/i", $attr, $m)) {
638 $img->setAttr($param, $m[1]);
639 if (isset($found[$param])) $found[$param]++;
640 else $found[$param] = 1;
645 // now all remaining args are added as <param> to the object
647 foreach ($args as $attr) {
648 if (!isset($found[$attr]) and preg_match("/^(\S+)=(\S+)$/i", $attr, $m)) {
649 $params[] = HTML::param(array('name' => $m[1],
655 $type = $img->getAttr('type');
657 if (file_exists($url)) {
658 $type = mime_content_type($url);
661 $object = HTML::object(array_merge($img->_attr,
662 array('type' => $type)), //'src' => $url
664 $object->setAttr('class', 'inlineobject');
666 foreach ($params as $param) $object->pushContent($param);
668 if (isBrowserSafari() and !isBrowserSafari(532)) { // recent chrome can do OBJECT
669 return HTML::embed($object->_attr, $object->_content);
671 $object->pushContent(HTML::embed($object->_attr));
679 $this->items = array();
685 $this->items[$this->size] = $item;
692 if ($this->size == 0) {
693 return false; // stack is empty
696 return $this->items[$this->size];
707 return $this->items[$this->size - 1];
714 // end class definition
/**
 * Split a query string into an associative array of arguments.
 *
 * Each '&'-separated chunk is split at its first '='. A chunk without '='
 * yields an empty-string value; an empty chunk is ignored. Neither names
 * nor values are urldecoded here.
 *
 * @param string $query_args Query string, e.g. "action=edit&version=3".
 * @return array Map of argument name => raw value.
 */
function SplitQueryArgs($query_args = '')
{
    // FIXME: use the arg-separator which might not be &
    $args = array();
    // foreach instead of each(): each() no longer exists as of PHP 8.0.
    foreach (explode('&', $query_args) as $pair) {
        if (preg_match('/^ ([^=]+) =? (.*) /x', $pair, $m)) {
            $args[$m[1]] = $m[2];
        }
    }
    return $args;
}
727 function LinkPhpwikiURL($url, $text = '', $basepage = false)
731 if (!preg_match('/^ phpwiki: ([^?]*) [?]? (.*) $/x', $url, $m)) {
732 return HTML::span(array('class' => 'error'), _("BAD phpwiki: URL"));
736 $pagename = urldecode($m[1]);
739 if (empty($pagename) &&
740 preg_match('/^(diff|edit|links|info)=([^&]+)$/', $qargs, $m)
742 // Convert old style links (to not break diff links in
744 $pagename = urldecode($m[2]);
745 $args = array("action" => $m[1]);
747 $args = SplitQueryArgs($qargs);
750 if (empty($pagename))
751 $pagename = $GLOBALS['request']->getArg('pagename');
753 if (isset($args['action']) && $args['action'] == 'browse')
754 unset($args['action']);
757 if (empty($args['action']))
759 else if (is_safe_action($args['action']))
760 $class = 'wikiaction';
762 if (empty($args['action']) || is_safe_action($args['action']))
763 $class = 'wikiaction';
765 // Don't allow administrative links on unlocked pages.
766 $dbi = $GLOBALS['request']->getDbh();
767 $page = $dbi->getPage($basepage ? $basepage : $pagename);
768 if (!$page->get('locked'))
769 return HTML::span(array('class' => 'wikiunsafe'),
770 HTML::u(_("Lock page to enable link")));
771 $class = 'wikiadmin';
775 $text = HTML::span(array('class' => 'rawurl'), $url);
777 $wikipage = new WikiPageName($pagename);
778 if (!$wikipage->isValid()) {
780 return $WikiTheme->linkBadWikiWord($wikipage, $url);
783 return HTML::a(array('href' => WikiURL($pagename, $args),
789 * A class to assist in parsing wiki pagenames.
791 * Now with subpages and anchors, parsing and passing around
792 * pagenames is more complicated. This should help.
796 /** Short name for page.
798 * This is the value of $name passed to the constructor.
799 * (For use, e.g. as a default label for links to the page.)
803 /** The full page name.
805 * This is the full name of the page (without anchor).
811 * This is the referenced anchor within the page, or the empty string.
816 * @param mixed $name Page name.
817 * WikiDB_Page, WikiDB_PageRevision, or string.
818 * This can be a relative subpage name (like '/SubPage'),
819 * or can be the empty string to refer to the $basename.
821 * @param mixed $basename Page name from which to interpret
822 * relative or other non-fully-specified page names.
824 * @param mixed $anchor For links to anchors in page.
826 function __construct($name, $basename = false, $anchor = false)
828 if (is_string($name)) {
829 $this->shortName = $name;
830 if (strstr($name, ':')) {
831 list($moniker, $shortName) = explode(":", $name, 2);
832 $map = getInterwikiMap(); // allow overrides to custom maps
833 if (isset($map->_map[$moniker])) {
834 $url = $map->_map[$moniker];
835 if (strstr($url, '%s'))
836 $url = sprintf($url, $shortName);
840 // expand Talk or User, but not to absolute urls!
841 if (strstr($url, '//')) {
842 if ($moniker == 'Talk')
843 $name = $name . SUBPAGE_SEPARATOR . _("Discussion");
844 elseif ($moniker == 'User')
849 $this->shortName = $shortName;
852 // FIXME: We should really fix the cause for "/PageName" in the WikiDB
853 if ($name == '' or $name[0] == SUBPAGE_SEPARATOR) {
855 $name = $this->_pagename($basename) . $name;
857 $name = $this->_normalize_bad_pagename($name);
858 $this->shortName = $name;
862 $name = $this->_pagename($name);
863 $this->shortName = $name;
866 $this->name = $this->_check($name);
867 $this->anchor = (string)$anchor;
878 if (!($tail = strrchr($name, SUBPAGE_SEPARATOR)))
880 return substr($name, 0, -strlen($tail));
883 function isValid($strict = false)
886 return !isset($this->_errors);
887 return (is_string($this->name) and $this->name != '');
890 function getWarnings()
893 if (isset($this->_warnings))
894 $warnings = array_merge($warnings, $this->_warnings);
895 if (isset($this->_errors))
896 $warnings = array_merge($warnings, $this->_errors);
900 return sprintf(_("“%s”: Bad page name: %s"),
901 $this->shortName, join(', ', $warnings));
904 function _pagename($page)
906 if (isa($page, 'WikiDB_Page'))
907 return $page->getName();
908 elseif (isa($page, 'WikiDB_PageRevision'))
909 return $page->getPageName();
910 elseif (isa($page, 'WikiPageName'))
915 function _normalize_bad_pagename($name)
917 trigger_error("Bad pagename: " . $name, E_USER_WARNING);
919 // Punt... You really shouldn't get here.
922 return $request->getArg('pagename');
924 assert($name[0] == SUBPAGE_SEPARATOR);
925 $this->_errors[] = sprintf(_("Leading %s not allowed"), SUBPAGE_SEPARATOR);
926 return substr($name, 1);
930 * Compress internal white-space to single space character.
932 * This leads to problems with loading a foreign charset pagename,
933 * which cannot be deleted anymore, because unknown chars are compressed.
934 * So BEFORE importing a file _check must be done !!!
936 function _check($pagename)
938 // Compress internal white-space to single space character.
939 $pagename = preg_replace('/[\s\xa0]+/', ' ', $orig = $pagename);
940 if ($pagename != $orig)
941 $this->_warnings[] = _("White space converted to single space");
943 // Delete any control characters.
944 if (DATABASE_TYPE == 'cvs' or DATABASE_TYPE == 'file' or DATABASE_TYPE == 'flatfile') {
945 $pagename = preg_replace('/[\x00-\x1f\x7f\x80-\x9f]/', '', $orig = $pagename);
946 if ($pagename != $orig)
947 $this->_errors[] = _("Control characters not allowed");
950 // Strip leading and trailing white-space.
951 $pagename = trim($pagename);
954 while ($pagename and $pagename[0] == SUBPAGE_SEPARATOR)
955 $pagename = substr($pagename, 1);
956 if ($pagename != $orig)
957 $this->_errors[] = sprintf(_("Leading %s not allowed"), SUBPAGE_SEPARATOR);
959 // ";" is urlencoded, so safe from php arg-delim problems
960 /*if (strstr($pagename, ';')) {
961 $this->_warnings[] = _("';' is deprecated");
962 $pagename = str_replace(';', '', $pagename);
965 // not only for SQL, also to restrict url length
966 if (strlen($pagename) > MAX_PAGENAME_LENGTH) {
967 $pagename = substr($pagename, 0, MAX_PAGENAME_LENGTH);
968 $this->_errors[] = _("Page name too long");
971 // disallow some chars only on file and cvs
972 if ((DATABASE_TYPE == 'cvs'
973 or DATABASE_TYPE == 'file'
974 or DATABASE_TYPE == 'flatfile')
975 and preg_match('/(:|\.\.)/', $pagename, $m)
977 $this->_warnings[] = sprintf(_("Illegal chars %s removed"), $m[1]);
978 $pagename = str_replace('..', '', $pagename);
979 $pagename = str_replace(':', '', $pagename);
/**
 * Expand tabs in string.
 *
 * Every tab is replaced by as many spaces as are needed to reach the next
 * multiple of $tab_width, counting columns from the most recent newline.
 *
 * @param string $str
 * @param integer $tab_width
 * @return string
 */
function expand_tabs($str, $tab_width = 8)
{
    $pieces = explode("\t", $str);
    // Text after the last tab needs no padding; it is appended untouched.
    $last = array_pop($pieces);

    $out = '';
    foreach ($pieces as $piece) {
        $out .= $piece;
        // Column = number of bytes since the last newline (or since the start).
        $newline = strrpos($out, "\n");
        if ($newline === false) {
            $column = strlen($out);
        } else {
            $column = strlen($out) - $newline - 1;
        }
        $out .= str_repeat(" ", $tab_width - $column % $tab_width);
    }

    return $out . $last;
}
1009 * Split WikiWords in page names.
1011 * It has been deemed useful to split WikiWords (into "Wiki Words") in
1012 * places like page titles. This is rumored to help search engines
1015 * @param $page string The page name.
1017 * @return string The split name.
1019 function SplitPagename($page)
1022 if (preg_match("/\s/", $page))
1023 return $page; // Already split --- don't split any more.
1025 // This algorithm is specialized for several languages.
1026 // (Thanks to Pierrick MEIGNEN)
1027 // Improvements for other languages welcome.
1030 // This mess splits between a lower-case letter followed by
1031 // either an upper-case or a numeral; except that it won't
1032 // split the prefixes 'Mc', 'De', or 'Di' off of their tails.
1033 switch ($GLOBALS['LANG']) {
1038 $RE[] = '/([[:lower:]])((?<!Mc|De|Di)[[:upper:]]|\d)/';
1041 $RE[] = '/([[:lower:]])((?<!Mc|Di)[[:upper:]]|\d)/';
1044 $sep = preg_quote(SUBPAGE_SEPARATOR, '/');
1045 // This splits the single-letter words 'I' and 'A' from any following
1046 // capitalized words.
1047 switch ($GLOBALS['LANG']) {
1049 $RE[] = "/(?<= |${sep}|^)([AI])([[:upper:]][[:lower:]])/";
1052 $RE[] = "/(?<= |${sep}|^)([À])([[:upper:]][[:lower:]])/";
1055 // Split at underscore
1056 $RE[] = '/(_)([[:alpha:]])/';
1057 $RE[] = '/([[:alpha:]])(_)/';
1058 // Split numerals from following letters.
1059 $RE[] = '/(\d)([[:alpha:]])/';
1060 // Split at subpage separators. TBD in WikiTheme.php
1061 $RE[] = "/([^${sep}]+)(${sep})/";
1062 $RE[] = "/(${sep})([^${sep}]+)/";
1064 foreach ($RE as $key)
1068 foreach ($RE as $regexp) {
1069 $page = preg_replace($regexp, '\\1 \\2', $page);
1074 function NoSuchRevision(&$request, $page, $version)
1076 $html = HTML(HTML::h2(_("Revision Not Found")),
1077 HTML::p(fmt("I'm sorry. Version %d of %s is not in the database.",
1078 $version, WikiLink($page, 'auto'))));
1079 include_once 'lib/Template.php';
1080 GeneratePage($html, _("Bad Version"), $page->getCurrentRevision());
/**
 * Get time offset for local time zone.
 *
 * @param int $time Get offset for this time. Default: now.
 * @param bool $no_colon Don't put colon between hours and minutes.
 * @return string Offset as a string in the format +HH:MM
 *                (or +HHMM when $no_colon is set).
 */
function TimezoneOffset($time = 0, $no_colon = false)
{
    if (!$time) {
        $time = time();
    }

    // date('Z') gives the UTC offset in seconds, negative west of Greenwich.
    $offset = date('Z', $time);
    $sign = '+';
    if ($offset < 0) {
        $sign = '-';
        $offset = -$offset;
    }

    // Round to the nearest whole minute before splitting into hours/minutes.
    $minutes = intval(($offset + 30) / 60);
    $separator = $no_colon ? '' : ':';

    return sprintf("%s%02d%s%02d",
        $sign, $minutes / 60, $separator, $minutes % 60);
}
/**
 * Format time in ISO-8601 format.
 *
 * The result is the local date and time joined by 'T', followed by the
 * local zone offset as produced by TimezoneOffset().
 *
 * @param int $time Time. Default: now.
 * @return string Date and time in ISO-8601 format.
 */
function Iso8601DateTime($time = 0)
{
    $stamp = $time ? $time : time();

    return date('Y-m-d', $stamp) . 'T' . date('H:i:s', $stamp) . TimezoneOffset($stamp);
}
/**
 * Format time in RFC-2822 format.
 *
 * @param int $time Time. Default: now.
 * @return string Date and time in RFC-2822 format.
 */
function Rfc2822DateTime($time = 0)
{
    $stamp = $time ? $time : time();
    // The second argument only needs to be truthy: it asks TimezoneOffset()
    // for the colon-less "+HHMM" form.
    $zone = TimezoneOffset($stamp, 'no colon');

    return date('D, j M Y H:i:s ', $stamp) . $zone;
}
/**
 * Format time in RFC-1123 format.
 *
 * The time is always rendered in GMT, independent of the local time zone.
 *
 * @param int $time Time. Default: now.
 * @return string Date and time in RFC-1123 format.
 */
function Rfc1123DateTime($time = 0)
{
    $stamp = $time ? $time : time();

    return gmdate('D, d M Y H:i:s \G\M\T', $stamp);
}
/** Parse date in RFC-1123 format.
 *
 * According to RFC 1123 we must accept dates in the following
 * formats:
 *
 *   Sun, 06 Nov 1994 08:49:37 GMT  ; RFC 822, updated by RFC 1123
 *   Sunday, 06-Nov-94 08:49:37 GMT ; RFC 850, obsoleted by RFC 1036
 *   Sun Nov  6 08:49:37 1994       ; ANSI C's asctime() format
 *
 * (Though we're only allowed to generate dates in the first format.)
 *
 * @param string $timestr Date string in one of the formats above.
 * @return int|false Unix timestamp, or false if the string cannot be parsed.
 */
function ParseRfc1123DateTime($timestr)
{
    $timestr = trim($timestr);
    if (preg_match('/^ \w{3},\s* (\d{1,2}) \s* (\w{3}) \s* (\d{4}) \s*'
        . '(\d\d):(\d\d):(\d\d) \s* GMT $/ix',
        $timestr, $m)
    ) {
        // RFC 822 / RFC 1123
        list(, $mday, $mon, $year, $hh, $mm, $ss) = $m;
    } elseif (preg_match('/^ \w+,\s* (\d{1,2})-(\w{3})-(\d{2}|\d{4}) \s*'
        . '(\d\d):(\d\d):(\d\d) \s* GMT $/ix',
        $timestr, $m)
    ) {
        // RFC 850: expand two-digit years (00-69 => 20xx, 70-99 => 19xx).
        list(, $mday, $mon, $year, $hh, $mm, $ss) = $m;
        $year = (int)$year;
        if ($year < 70) {
            $year += 2000;
        } elseif ($year < 100) {
            $year += 1900;
        }
    } elseif (preg_match('/^\w+\s* (\w{3}) \s* (\d{1,2}) \s*'
        . '(\d\d):(\d\d):(\d\d) \s* (\d{4})$/ix',
        $timestr, $m)
    ) {
        // asctime(): month comes before the day, the year comes last.
        list(, $mon, $mday, $hh, $mm, $ss, $year) = $m;
    } else {
        // None of the accepted formats matched.
        return false;
    }

    // "{$var}" instead of "${var}": the latter is deprecated since PHP 8.2.
    $time = strtotime("{$mday} {$mon} {$year} {$hh}:{$mm}:{$ss} GMT");
    if ($time === false) {
        return false; // failed
    }
    return $time;
}
/**
 * Format time to standard 'ctime' format.
 *
 * The time is rendered in the local time zone, e.g. "Sun Nov 6 08:49:37 1994".
 *
 * @param int $time Time. Default: now.
 * @return string Date and time.
 */
function CTime($time = 0)
{
    $stamp = $time ? $time : time();

    return date("D M j H:i:s Y", $stamp);
}
1207 * Format number as kibibytes or bytes.
1208 * Short format is used for PageList
1209 * Long format is used in PageInfo
1211 * @param $bytes int. Default: 0.
1212 * @param $longformat bool. Default: false.
1213 * @return FormattedText (XmlElement.php).
1215 function ByteFormatter($bytes = 0, $longformat = false)
1219 if ($bytes < 1024) {
1221 $size = fmt("%s B", $bytes);
1223 $size = fmt("%s bytes", $bytes);
1225 $kb = round($bytes / 1024, 1);
1227 $size = fmt("%s KiB", $kb);
1229 $size = fmt("%s KiB (%s bytes)", $kb, $bytes);
/**
 * Internationalized printf.
 *
 * This is essentially the same as PHP's built-in printf
 * with the following exceptions:
 * <ol>
 * <li> It passes the format string through gettext().
 * <li> It supports the argument reordering extensions.
 * </ol>
 *
 * Example:
 *
 * In php code, use:
 * <pre>
 *    __printf("Differences between versions %s and %s of %s",
 *             $new_link, $old_link, $page_link);
 * </pre>
 *
 * Then in locale/po/de.po, one can reorder the printf arguments:
 *
 * <pre>
 *    msgid "Differences between %s and %s of %s."
 *    msgstr "Der Unterschiedsergebnis von %3$s, zwischen %1$s und %2$s."
 * </pre>
 *
 * (Note that while PHP tries to expand $vars within double-quotes,
 * the values in msgstr undergo no such expansion, so the '$'s
 * are fine there.)
 *
 * One shouldn't use reordered arguments in the default format string.
 * Backslashes in the default string would be necessary to escape the
 * '$'s, and they'll cause all kinds of trouble....
 *
 * @param string $fmt Format string; further arguments are the values to insert.
 */
function __printf($fmt)
{
    // Everything after the format string is a substitution value.
    $values = array_slice(func_get_args(), 1);

    echo __vsprintf($fmt, $values);
}
/**
 * Internationalized sprintf.
 *
 * Works like PHP's built-in sprintf, except that:
 * <li> the format string is passed through gettext(), and
 * <li> translated format strings may reorder their arguments.
 *
 * @param string $fmt Format string; further arguments are the values.
 * @return string The formatted, translated string.
 */
function __sprintf($fmt)
{
    // Everything after the format string is a substitution value.
    $values = array_slice(func_get_args(), 1);
    return __vsprintf($fmt, $values);
}
/**
 * Internationalized vsprintf.
 *
 * Works like PHP's built-in vsprintf, except that:
 * <li> the format string is passed through gettext(), and
 * <li> '%2$s' style argument reordering is resolved here, by rearranging
 *      the argument list to follow the order used in the format string.
 *
 * Variable-width specifiers such as sprintf("%*s", 10, "x") are not supported.
 *
 * @param string $fmt  Format string (the gettext msgid).
 * @param array  $args Values to substitute, in msgid order.
 * @return string The formatted, translated string.
 */
function __vsprintf($fmt, $args)
{
    $fmt = gettext($fmt);

    if (preg_match_all('/(?<!%)%(\d+)\$/x', $fmt, $m)) {
        // Format string has '%2$s' style argument reordering.
        if (preg_match('/(?<!%)%[- ]?\d*[^- \d$]/x', $fmt)) {
            // literal variable name substitution only to keep locale
            // strings uncluttered
            trigger_error(sprintf(_("Can't mix “%s” with “%s” type format strings"),
                '%1\$s', '%s'), E_USER_WARNING); //php+locale error
        }

        // Turn every positional specifier into a plain one ...
        $fmt = preg_replace('/(?<!%)%\d+\$/x', '%', $fmt);

        // ... and reorder the arguments to match.
        $newargs = array();
        $argc = count($args);
        foreach ($m[1] as $argnum) {
            if ($argnum < 1 || $argnum > $argc) {
                trigger_error(sprintf(_("%s: argument index out of range"),
                    $argnum), E_USER_WARNING);
                // Keep the argument count in step with the format string
                // without reading an undefined offset.
                $newargs[] = '';
                continue;
            }
            $newargs[] = $args[$argnum - 1];
        }
        $args = $newargs;
    }

    return vsprintf($fmt, $args);
}
/**
 * Modification time of a file.
 *
 * @param string $filename Path to inspect.
 * @return int|bool Unix timestamp, or false when stat() fails.
 */
function file_mtime($filename)
{
    $info = @stat($filename);
    return $info ? $info['mtime'] : false;
}
/**
 * usort() comparator on file modification times: the more recently
 * modified file sorts first. Files whose mtime cannot be read compare equal.
 *
 * @param string $a First file name.
 * @param string $b Second file name.
 * @return int -1, 0 or 1.
 */
function sort_file_mtime($a, $b)
{
    $first = file_mtime($a);
    $second = file_mtime($b);
    if (!$first || !$second || $first == $second) {
        return 0;
    }
    if ($first > $second) {
        return -1;
    }
    return 1;
}
1359 * Build an array in $this->_fileList of files from $dirname.
1360 * Subdirectories are not traversed.
1362 * (This was a function LoadDir in lib/loadsave.php)
1363 * See also http://www.php.net/manual/en/function.readdir.php
// Returns the collected file names, optionally reordered according to
// $sortby and cut down to the first $limit entries.
// NOTE(review): $exclude is not referenced in any line visible in this
// excerpt -- confirm whether it is used at all.
1365 function getFiles($exclude = '', $sortby = '', $limit = '')
1367 $list = $this->_fileList;
// PageList is only pulled in to normalise the $sortby specification.
1370 require_once 'lib/PageList.php';
1371 switch (Pagelist::sortby($sortby, 'db')) {
// The list is left untouched for 'pagename ASC', i.e. it is presumably
// already in ascending name order -- TODO confirm.
1372 case 'pagename ASC':
1374 case 'pagename DESC':
1375 $list = array_reverse($list);
// NOTE(review): the case labels of the two mtime branches below are not
// visible here; the second one reverses the order produced by the first.
1378 usort($list, 'sort_file_mtime');
1381 usort($list, 'sort_file_mtime');
1382 $list = array_reverse($list);
// array_splice() works on the local copy, so $this->_fileList stays intact.
1387 return array_splice($list, 0, $limit);
/**
 * Decide whether a file name belongs to this set.
 *
 * Without a pattern every name is accepted; otherwise the glob pattern is
 * converted to PCRE once, cached, and matched case-insensitively when
 * $this->_case is false.
 *
 * @param string $filename Bare file name.
 * @return bool|int True when no pattern is set, else the preg_match() result.
 */
function _filenameSelector($filename)
{
    if (!$this->_pattern) {
        return true;
    }
    if (!$this->_pcre_pattern) {
        $this->_pcre_pattern = glob_to_pcre($this->_pattern);
    }
    $closing = $this->_case ? '/' : '/i';
    return preg_match('/' . $this->_pcre_pattern . $closing, $filename);
}
/**
 * Collect the plain files of $directory whose names pass
 * _filenameSelector(). Dot files and anything that is not a regular file
 * are skipped. Problems are reported with E_USER_NOTICE and leave the
 * file list empty.
 *
 * NOTE(review): this is a PHP 4 style constructor (method named after the
 * class); PHP 8 no longer calls such methods on `new` -- confirm how the
 * class is instantiated.
 *
 * @param string      $directory   Directory to scan.
 * @param string|bool $filepattern Glob pattern, or false to accept every file.
 */
function fileSet($directory, $filepattern = false)
{
    $this->_fileList = array();
    $this->_pattern = $filepattern;
    if ($filepattern) {
        $this->_pcre_pattern = glob_to_pcre($this->_pattern);
    }
    $this->_case = !isWindows();
    $this->_pathsep = '/';

    if (empty($directory)) {
        trigger_error(sprintf(_("%s is empty."), 'directoryname'),
            E_USER_NOTICE);
        return; // early return
    }

    @ $dir_handle = opendir($dir = $directory);
    if (empty($dir_handle)) {
        trigger_error(sprintf(_("Unable to open directory “%s” for reading"),
            $dir), E_USER_NOTICE);
        return; // early return
    }

    // Compare against false explicitly: a file named "0" is falsy and
    // would otherwise end the scan early.
    while (($filename = readdir($dir_handle)) !== false) {
        if ($filename[0] == '.' || filetype($dir . $this->_pathsep . $filename) != 'file')
            continue;
        if ($this->_filenameSelector($filename)) {
            array_push($this->_fileList, "$filename");
        }
    }
    closedir($dir_handle);
}
/**
 * Expands a list containing regex's to its matching entries.
 *
 * The list is held by reference: expanding entry $index removes that entry
 * and appends every candidate that matches the pattern.
 */
class ListRegexExpand
{
    public $match, $list, $index, $case_sensitive;

    /**
     * @param array  $list           List to expand in place.
     * @param string $match          PCRE pattern body (without delimiters).
     * @param bool   $case_sensitive Match case-sensitively. Default: true.
     */
    function __construct(&$list, $match, $case_sensitive = true)
    {
        $this->match = $match;
        $this->list = &$list;
        $this->case_sensitive = $case_sensitive;
        //$this->index = false;
    }

    /**
     * PHP 4 style constructor name, kept so existing explicit calls keep
     * working. PHP 8 no longer treats it as the constructor, hence
     * __construct() above.
     */
    function ListRegexExpand(&$list, $match, $case_sensitive = true)
    {
        $this->__construct($list, $match, $case_sensitive);
    }

    /**
     * array_walk() callback: on a match, drop the pattern entry at
     * $this->index from the list and append $item.
     */
    function listMatchCallback($item, $key)
    {
        $quoted = str_replace('/', '\/', $item);
        if (preg_match('/' . $this->match . ($this->case_sensitive ? '/' : '/i'),
            $quoted)
        ) {
            unset($this->list[$this->index]);
            $this->list[] = $item;
        }
    }

    /**
     * Replace list entry $index by all members of $pages that match.
     *
     * @param int   $index Key of the pattern entry in the list.
     * @param array $pages Candidate names.
     * @return array The expanded list.
     */
    function expandRegex($index, &$pages)
    {
        $this->index = $index;
        array_walk($pages, array($this, 'listMatchCallback'));
        return $this->list;
    }
}
1472 // Convert fileglob to regex style:
1473 // Convert some wildcards to pcre style, escape the rest
1474 // Escape . \\ + * ? [ ^ ] $ ( ) { } = ! < > | : /
1475 // Fixed bug #994994: "/" in $glob.
// Translates a file glob into the body of a PCRE pattern (no delimiters).
// The byte \xff is used as a temporary stand-in for the backslash while the
// replacements run and is removed again at the end.
// NOTE(review): several statements of this function are not visible in this
// excerpt (e.g. the definition of $special and the bodies of the ifs), so
// the notes below cover the visible lines only.
1476 function glob_to_pcre($glob)
1478 // check simple case: no need to escape
1479 $escape = '\[](){}=!<>|:/';
// strcspn() equals strlen() only when $glob holds none of the listed characters.
1480 if (strcspn($glob, $escape . ".+*?^$") == strlen($glob))
1482 // preg_replace cannot handle "\\\\\\2" so convert \\ to \xff
1483 $glob = strtr($glob, "\\", "\xff");
1484 $glob = str_replace("/", "\\/", $glob);
1485 // first convert some unescaped expressions to pcre style: . => \.
1487 $re = preg_replace('/([^\xff])?([' . preg_quote($special) . '])/',
1488 "\\1\xff\\2", $glob);
// Glob wildcards become their PCRE equivalents: "*" => ".*" and "?" => ".".
1491 $re = preg_replace('/([^\xff])?\*/', '$1.*', $re);
1492 $re = preg_replace('/([^\xff])?\?/', '$1.', $re);
// These two tests look at whether the glob starts / ends with a wildcard;
// presumably the result is anchored with ^ / $ otherwise -- TODO confirm.
1493 if (!preg_match('/^[\?\*]/', $glob))
1495 if (!preg_match('/[\?\*]$/', $glob))
1498 // Fixes Bug 1182997
1499 // .*? handled above, now escape the rest
1500 //while (strcspn($re, $escape) != strlen($re)) // loop strangely needed
1501 $re = preg_replace('/([^\xff])([' . preg_quote($escape, "/") . '])/',
1503 // Problem with 'Date/Time' => 'Date\/Time' => 'Date\xff\/Time' => 'Date\/Time'
// Drop every \xff placeholder from the result.
1505 $re = preg_replace('/\xff/', '', $re);
/**
 * Test a string against a file glob.
 *
 * @param string $glob           Glob pattern.
 * @param string $against        String to test.
 * @param bool   $case_sensitive Default: true.
 * @return int|bool Result of preg_match().
 */
function glob_match($glob, $against, $case_sensitive = true)
{
    $closing = $case_sensitive ? '/' : '/i';
    $pattern = '/' . glob_to_pcre($glob) . $closing;
    return preg_match($pattern, $against);
}
/**
 * Split a comma separated list and expand every entry that contains a
 * wildcard ('?' or '*') into the matching members of $allnames.
 *
 * @param string $input          Comma separated names and/or patterns.
 * @param array  $allnames       Candidate names for the expansion.
 * @param bool   $glob_style     Treat patterns as globs (true) or as PCRE bodies.
 * @param bool   $case_sensitive Default: true.
 * @return array Expanded list.
 */
function explodeList($input, $allnames, $glob_style = true, $case_sensitive = true)
{
    $wildcard = '/[\?\*]/';
    $list = explode(',', $input);
    if (!preg_match($wildcard, $input)) {
        return $list;
    }

    // Only the entries present before expansion are inspected; matches are
    // appended behind them by ListRegexExpand.
    $initial = sizeof($list);
    for ($pos = 0; $pos < $initial; $pos++) {
        $entry = $list[$pos];
        if (!preg_match($wildcard, $entry)) {
            continue;
        }
        reset($allnames);
        $regex = $glob_style ? glob_to_pcre($entry) : $entry;
        $expand = new ListRegexExpand($list, $regex, $case_sensitive);
        $expand->expandRegex($pos, $allnames);
    }
    return $list;
}
1535 // echo implode(":",explodeList("Test*",array("xx","Test1","Test2")));
/**
 * Thin wrapper that loads lib/PageList.php on demand and forwards all
 * arguments to PageList::explodePageList().
 */
function explodePageList($input, $include_empty = false, $sortby = 'pagename',
                         $limit = '', $exclude = '')
{
    include_once 'lib/PageList.php';
    $pages = PageList::explodePageList($input, $include_empty, $sortby, $limit, $exclude);
    return $pages;
}
1543 // Class introspections
/**
 * Determine whether object is of a specified type.
 * (Builtin as is_a() since PHP 4.2.0; the instanceof operator is the
 * modern spelling.)
 *
 * @param $object object An object.
 * @param $class string Class name.
 * @return bool True iff $object is a $class
 * or a sub-type of $class.
 */
function isa($object, $class)
{
    if (!is_object($object)) {
        return false;
    }
    if (strtolower(get_class($object)) == strtolower($class)) {
        return true;
    }
    return is_subclass_of($object, $class);
}
/**
 * Determine whether a function is okay to use.
 *
 * Some providers (e.g. Lycos) disable some PHP functions for "security
 * reasons". Those functions are unusable even though function_exists()
 * reports them.
 *
 * This function tests that a function exists and is not listed in PHP's
 * disable_functions config setting.
 *
 * @param string $function_name Function name
 * @return bool True iff function can be used.
 */
function function_usable($function_name)
{
    static $disabled;
    if (!is_array($disabled)) {
        // Use get_cfg_var since ini_get() is one of the disabled functions
        // (on Lycos, at least.)
        $names = preg_split('/\s*,\s*/', trim(get_cfg_var('disable_functions')));
        $disabled = array();
        foreach ($names as $name) {
            $disabled[strtolower($name)] = true;
        }
    }

    if (!function_exists($function_name)) {
        return false;
    }
    return !isset($disabled[strtolower($function_name)]);
}
1594 * This is used for generating ETags.
// Dispatches on the type of $x: scalar, array or object.
// NOTE(review): the statements inside the scalar and object branches are
// not visible in this excerpt.
1596 function wikihash($x)
1598 if (is_scalar($x)) {
1600 } elseif (is_array($x)) {
// Arrays are reduced to the md5 of their serialized form.
1602 return md5(serialize($x));
1603 } elseif (is_object($x)) {
// Reached for values that are neither scalar, array nor object (e.g. null).
1606 trigger_error("Can't hash $x", E_USER_ERROR);
/**
 * Random string of typeable 7 bit ASCII characters (codes 40..126, which
 * leaves out the quote characters).
 *
 * @param int $length Number of characters. Default: 1.
 * @return string
 */
function rand_ascii($length = 1)
{
    $chars = array();
    for ($n = 1; $n <= $length; $n++) {
        $chars[] = chr(mt_rand(40, 126));
    }
    return implode('', $chars);
}
/**
 * Random word made of easily readable letters and digits.
 * By Dan Frankowski.
 *
 * @param int $length Number of characters. Default: 6.
 * @return string
 */
function rand_ascii_readable($length = 6)
{
    // Don't use 1lI0O, because they're hard to read
    $letters = "abcdefghijkmnopqrstuvwxyzABCDEFGHJKLMNPQRSTUVWXYZ23456789";
    $last = strlen($letters) - 1;

    // Pick a few random letters or numbers
    $word = "";
    $picked = 0;
    while ($picked < $length) {
        $word .= $letters[mt_rand(0, $last)];
        $picked++;
    }
    return $word;
}
/**
 * Recursively count all non-empty elements
 * in array of any dimension or mixed - i.e.
 * array('1' => 2, '2' => array('1' => 3, '2' => 4))
 * See http://www.php.net/manual/en/function.count.php
 *
 * @param mixed $arg Value or (nested) array.
 * @return int Number of non-empty leaves.
 */
function count_all($arg)
{
    // skip if argument is empty
    if (!$arg) {
        return 0;
    }
    // not an array, return 1 (base case)
    if (!is_array($arg)) {
        return 1;
    }
    // else call recursively for all elements of $arg
    $total = 0;
    foreach ($arg as $element) {
        $total += count_all($element);
    }
    return $total;
}
/**
 * Test whether a page name contains SUBPAGE_SEPARATOR.
 *
 * @param string $pagename
 * @return string|bool The name from the first separator on, or false.
 */
function isSubPage($pagename)
{
    $fromSeparator = strstr($pagename, SUBPAGE_SEPARATOR);
    return $fromSeparator;
}
/**
 * Return one component of a page name split at SUBPAGE_SEPARATOR.
 *
 * @param string $pagename
 * @param int    $pos Component offset as understood by array_slice()
 *                    (negative values count from the end).
 * @return string
 */
function subPageSlice($pagename, $pos)
{
    $components = explode(SUBPAGE_SEPARATOR, $pagename);
    $picked = array_slice($components, $pos, 1);
    return $picked[0];
}
/**
 * Test whether $filename is one of the entries of the global
 * $AllActionPages after each entry has been passed through __().
 *
 * @param string $filename
 * @return bool
 */
function isActionPage($filename)
{
    global $AllActionPages;

    $translated = array_map("__", $AllActionPages);
    $found = in_array($filename, $translated);
    return $found;
}
1683 * Class for "popping up" and alert box. (Except that right now, it doesn't
1687 * This is a hackish and needs to be refactored. However it would be nice to
1688 * unify all the different methods we use for showing Alerts and Dialogs.
1689 * (E.g. "Page deleted", login form, ...)
1694 * @param mixed $head Header ("title") for alert box.
1695 * @param mixed $body The text in the alert box.
1696 * @param array $buttons An array mapping button labels to URLs.
1697 * The default is a single "Okay" button pointing to $request->getURLtoSelf().
// Stores the header, body and button map for later display.
1699 function __construct($head, $body, $buttons = array())
// An array body is turned into list markup, one HTML::li() per entry.
// NOTE(review): the statements that create $html and hand it back to $body
// are not visible in this excerpt.
1701 if (is_array($body)) {
1703 foreach ($body as $li) {
1704 $html->pushContent(HTML::li($li));
// Template tokens; the 'BUTTONS' token is added later, just before rendering.
1708 $this->_tokens = array('HEADER' => $head, 'CONTENT' => $body);
1709 $this->_buttons = $buttons;
1713 * Show the alert box.
// NOTE(review): the header of this method and the statements after the
// Template is created are not visible in this excerpt.
1719 $tokens = $this->_tokens;
// The buttons are built before any pending output is discarded.
1720 $tokens['BUTTONS'] = $this->_getButtons();
1722 $request->discardOutput();
// Render through the 'dialog' template.
1723 $tmpl = new Template('dialog', $request, $tokens);
/**
 * Build the buttons of the alert box.
 *
 * Falls back to a single "OK" button pointing to $request->getURLtoSelf()
 * when no buttons were given to the constructor.
 *
 * @return XmlContent One 'wikiaction' button per label => URL pair.
 */
function _getButtons()
{
    global $request, $WikiTheme;

    $buttons = $this->_buttons;
    if (!$buttons) {
        $buttons = array(_("OK") => $request->getURLtoSelf());
    }

    // Create a button for every entry. The loop used to contain only a
    // leftover debug print, so just the last button was ever built.
    $out = array();
    foreach ($buttons as $label => $url) {
        $out[] = $WikiTheme->makeButton($label, $url, 'wikiaction');
    }
    return new XmlContent($out);
}
/**
 * PHPWIKI_VERSION as a comparable number:
 * major * 1000 + minor * 10 + 0.01 * patch, minus 0.01 for 'pre' and 'rc'
 * releases. The result is computed once and cached.
 *
 * Examples:
 *   1.3.9-p1  => 1030.091
 *   1.3.10pre => 1030.09
 *
 * @return float
 */
function phpwiki_version()
{
    static $PHPWIKI_VERSION;
    if (isset($PHPWIKI_VERSION)) {
        return $PHPWIKI_VERSION;
    }

    $trimmed = preg_replace('/\D+$/', '', PHPWIKI_VERSION); // remove the pre
    $arr = explode('.', $trimmed);
    // Every non-digit in the patch part becomes a dot, runs of dots collapse.
    $dotted = preg_replace('/\D/', '.', $arr[2]);
    $arr[2] = preg_replace('/\.+/', '.', $dotted);

    $PHPWIKI_VERSION = $arr[0] * 1000 + $arr[1] * 10 + 0.01 * $arr[2];
    if (strstr(PHPWIKI_VERSION, 'pre') or strstr(PHPWIKI_VERSION, 'rc')) {
        $PHPWIKI_VERSION -= 0.01;
    }
    return $PHPWIKI_VERSION;
}
/**
 * Output handler: gzip-encode the buffer, record the compressed length on
 * the global request object and announce it as Content-Length while
 * headers can still be sent.
 *
 * @param string $ob Buffered output.
 * @return string Compressed output.
 */
function phpwiki_gzhandler($ob)
{
    $compressed = gzencode($ob);
    $GLOBALS['request']->_ob_get_length = strlen($compressed);
    if (!headers_sent()) {
        $header = sprintf("Content-Length: %d", $GLOBALS['request']->_ob_get_length);
        header($header);
    }
    return $compressed;
}
/**
 * Test whether the whole of $word matches the global $WikiNameRegexp.
 *
 * @param string $word
 * @return int|bool Result of preg_match().
 */
function isWikiWord($word)
{
    global $WikiNameRegexp;
    //or preg_match('/\A' . $WikiNameRegexp . '\z/', $word) ??
    $pattern = '/^' . $WikiNameRegexp . '$/';
    return preg_match($pattern, $word);
}
/**
 * Copy object values into a plain array.
 * Needed to store serialized object values only (perm, pref).
 *
 * @param object     $obj     Source object.
 * @param array|bool $exclude Keys to leave out, or false for none.
 * @param array|bool $fields  Key => value pairs to use instead of the
 *                            object's own variables.
 * @return array
 */
function obj2hash($obj, $exclude = false, $fields = false)
{
    if (!$fields) $fields = get_object_vars($obj);

    $filtering = is_array($exclude);
    $hash = array();
    foreach ($fields as $name => $value) {
        if ($filtering && in_array($name, $exclude)) {
            continue;
        }
        $hash[$name] = $value;
    }
    return $hash;
}
/**
 * isAsciiString($string)
 *
 * @param string $s
 * @return int|bool preg_match() result: 1 when $s holds 7 bit bytes only.
 */
function isAsciiString($s)
{
    return preg_match('/^([\x00-\x7F])*$/s', $s);
}
/**
 * isUtf8String($string) - cheap utf-8 detection
 *
 * The original author warns that this segfaults for strings longer than
 * 10kb and points to
 * http://www.phpdiscuss.com/article.php?id=565&group=php.i18n or
 * checkTitleEncoding() at http://cvs.sourceforge.net/viewcvs.py/wikipedia/phase3/languages/Language.php
 * as alternatives.
 *
 * @param string $s
 * @return int|bool Result of preg_match().
 */
function isUtf8String($s)
{
    // One alternative per sequence length: lead byte range, then the
    // required number of continuation bytes.
    $sequences = array(
        '[\x00-\x7F]',
        '[\xC2-\xDF][\x80-\xBF]',
        '[\xE0-\xEF][\x80-\xBF]{2}',
        '[\xF0-\xF4][\x80-\xBF]{3}',
        '[\xF8-\xFB][\x80-\xBF]{4}',
        '[\xFC-\xFD][\x80-\xBF]{5}',
    );
    $pattern = '/^(' . implode('|', $sequences) . ')*$/s';
    return preg_match($pattern, $s);
}
1821 * Check for UTF-8 URLs; Internet Explorer produces these if you
1822 * type non-ASCII chars in the URL bar or follow unescaped links.
1823 * Requires urldecoded pagename.
1824 * Fixes sf.net bug #953949
1826 * src: languages/Language.php:checkTitleEncoding() from mediawiki
// NOTE(review): only the signature of this function is visible in this
// excerpt; its body could not be reviewed.
1828 function fixTitleEncoding($s)
/**
 * Workaround for allow_url_fopen, to get the content of an external URI.
 * It returns the contents in one slurp. Parsers might want to check for
 * allow_url_fopen and use fopen, fread chunkwise. (see lib/XmlParser.php)
 *
 * @param string $uri Absolute URI.
 * @return string|bool Content, or false on failure (including a URI that
 *                     cannot be parsed or has no host).
 */
function url_get_contents($uri)
{
    if (get_cfg_var('allow_url_fopen')) { // was ini_get('allow_url_fopen'))
        return @file_get_contents($uri);
    }

    require_once 'lib/HttpClient.php';
    $bits = parse_url($uri);
    // parse_url() yields false for seriously malformed input and omits
    // 'host' for relative references; neither can be fetched.
    if (!is_array($bits) || empty($bits['host'])) {
        return false;
    }
    $host = $bits['host'];
    $port = isset($bits['port']) ? $bits['port'] : 80;
    $path = isset($bits['path']) ? $bits['path'] : '/';
    if (isset($bits['query'])) {
        $path .= '?' . $bits['query'];
    }

    $client = new HttpClient($host, $port);
    $client->use_gzip = false;
    if (!$client->get($path)) {
        return false;
    }
    return $client->getContent();
}
/**
 * Generate consecutively named strings:
 * Name, Name2, Name3, ...
 *
 * @param string $name Base name.
 * @return string The base name on first use, afterwards the name with a
 *                running number appended.
 */
function GenerateId($name)
{
    static $ids = array();

    if (!empty($ids[$name])) {
        $ids[$name]++;
        return $name . $ids[$name];
    }
    $ids[$name] = 1;
    return $name;
}
1877 // from IncludePage. To be of general use.
1878 // content: string or array of strings
// Truncates $content to its first $n space separated words; $content may
// be a string or an array of lines.
// NOTE(review): several statements (initialisations, else branches and
// returns) are not visible in this excerpt.
1879 function firstNWordsOfContent($n, $content)
1881 if ($content and $n > 0) {
1882 if (is_array($content)) {
1883 // fixme: return a list of lines then?
1884 //$content = join("\n", $content);
1885 //$return_array = true;
1887 foreach ($content as $line) {
1888 $words = explode(' ', $line);
// This line would exceed the limit: keep only the words that still fit
// and append the translated "first N words" marker.
1889 if ($wordcount + count($words) > $n) {
1890 $new[] = implode(' ', array_slice($words, 0, $n - $wordcount))
1891 . sprintf(_("... (first %s words)"), $n);
1894 $wordcount += count($words);
1900 // fixme: use better whitespace/word seperators
// String input: same truncation, applied to the whole string at once.
1901 $words = explode(' ', $content);
1902 if (count($words) > $n) {
1903 return join(' ', array_slice($words, 0, $n))
1904 . sprintf(_("... (first %s words)"), $n);
1914 // moved from lib/plugin/IncludePage.php
// Looks up the section headed by $section inside $content (an array of
// lines, joined with "\n" for matching) and returns its lines as an array.
// NOTE(review): some lines of this function are not visible in this excerpt.
1915 function extractSection($section, $content, $page, $quiet = false, $sectionhead = false)
// Any whitespace run in the section name matches any whitespace run in the page.
1917 $qsection = preg_replace('/\s+/', '\s+', preg_quote($section, '/'));
1919 if (preg_match("/ ^(!{1,}|={2,})\\s*$qsection\s*=*" // section header
1920 . " \\s*$\\n?" // possible blank lines
1921 . " ( (?: ^.*\\n? )*? )" // some lines
1922 . " (?= ^\\1 | \\Z)/xm", // sec header (same or higher level) (or EOF)
1923 implode("\n", $content),
1926 // Strip trailing blanks lines and ---- <hr>s
1927 $text = preg_replace("/\\s*^-{4,}\\s*$/m", "", $match[2]);
// Puts the header marker and section name back in front of the text;
// presumably only when $sectionhead is set -- TODO confirm.
1929 $text = $match[1] . $section . "\n" . $text;
1930 return explode("\n", $text);
// No match: the result is a one-element array holding an error message.
1933 $mesg = $page . " " . $section;
1936 return array(sprintf(_("<%s: no such section>"), $mesg));
1939 // Extract the first $sections sections of the page
// Walks through $content section by section while $sections is positive.
// NOTE(review): the statements that build $result and update $sections are
// not visible in this excerpt.
1940 function extractSections($sections, $content, $page, $quiet = false, $sectionhead = false)
1943 $mycontent = $content;
1946 while ($sections > 0) {
1948 if (preg_match("/ ^(!{1,}|={2,})\\s*(.*)\\n" // section header
1949 . " \\s*$\\n?" // possible blank lines
1950 . " ( (?: ^.*\\n? )*? )" // some lines
1951 . " ( ^\\1 (.|\\n)* | \\Z)/xm", // sec header (same or higher level) (or EOF)
1952 implode("\n", $mycontent),
// $match[2] is the header text of the section found.
1955 $section = $match[2];
1956 // Strip trailing blanks lines and ---- <hr>s
1957 $text = preg_replace("/\\s*^-{4,}\\s*$/m", "", $match[3]);
1959 $text = $match[1] . $section . "\n" . $text;
// Continue with the remainder of the page, starting at the next header.
1962 $mycontent = explode("\n", $match[4]);
1964 if ($sections === 0) {
1965 return explode("\n", $result);
/**
 * Faster check: lib/ExternalReferrer.php is only loaded when the request
 * carries a referrer that does not start with SERVER_URL.
 *
 * @param object $request Request object providing get('HTTP_REFERER').
 * @return mixed False for a missing or internal referrer, otherwise the
 *               result of SearchEngines::parseSearchQuery().
 */
function isExternalReferrer(&$request)
{
    $referrer = $request->get('HTTP_REFERER');
    if (!$referrer) {
        //if (DEBUG) return array('query' => 'wiki');
        return false;
    }

    $home = SERVER_URL; // SERVER_URL or SCRIPT_NAME, if we want to check sister wiki's also
    if (string_starts_with(strtolower($referrer), strtolower($home))) {
        return false;
    }

    require_once 'lib/ExternalReferrer.php';
    $se = new SearchEngines();
    return $se->parseSearchQuery($referrer);
}
/**
 * Make sure a PHP extension is loaded, trying dl() when it is not.
 * Useful for PECL overrides: cvsclient, ldap, soap, xmlrpc, pdo, pdo_<driver>
 *
 * @param string $extension Extension name without prefix or suffix.
 * @return bool True when the extension is available afterwards.
 */
function loadPhpExtension($extension)
{
    if (extension_loaded($extension)) {
        return true;
    }
    // dl() does not exist in every SAPI; calling it blindly would be fatal.
    if (!function_exists('dl')) {
        return false;
    }

    $isWindows = (substr(PHP_OS, 0, 3) == 'WIN');
    $soname = ($isWindows ? 'php_' : '')
        . $extension
        . ($isWindows ? '.dll' : '.so');
    if (!@dl($soname)) {
        return false;
    }
    return extension_loaded($extension);
}
/**
 * Test whether $string begins with $prefix (byte-wise, case-sensitive).
 *
 * @param string $string
 * @param string $prefix An empty prefix always matches.
 * @return bool
 */
function string_starts_with($string, $prefix)
{
    $prefix = (string)$prefix;
    // strncmp() compares bytes; a loose == would treat numeric looking
    // strings such as "1e3" and "1000" as equal.
    return strncmp((string)$string, $prefix, strlen($prefix)) === 0;
}
/**
 * Test whether $string ends with $suffix (byte-wise, case-sensitive).
 *
 * @param string $string
 * @param string $suffix An empty suffix always matches.
 * @return bool
 */
function string_ends_with($string, $suffix)
{
    $string = (string)$string;
    $suffix = (string)$suffix;
    $length = strlen($suffix);
    // substr($string, -0) would return the whole string, so the empty
    // suffix needs its own answer.
    if ($length === 0) {
        return true;
    }
    if ($length > strlen($string)) {
        return false;
    }
    // Strict comparison: "1e3" must not count as equal to "1000".
    return substr($string, -$length) === $suffix;
}
/**
 * Remove every occurrence of a value from an array and reindex the rest.
 *
 * @param array $arr
 * @param mixed $value Compared the way array_diff() compares.
 * @return array Remaining values, keyed 0..n-1.
 */
function array_remove($arr, $value)
{
    $kept = array_diff($arr, array($value));
    return array_values($kept);
}
/**
 * Ensure that the script will have another $secs time left.
 * Works only if safe_mode is off.
 * For example not to timeout on waiting socket connections.
 * Use the socket timeout as arg.
 *
 * @param int $secs Seconds that should still be available. Default: 30.
 */
function longer_timeout($secs = 30)
{
    // Fall back to 30 seconds when no (or an unlimited, 0) limit is configured.
    $timeout = @ini_get("max_execution_time") ? ini_get("max_execution_time") : 30;
    $remaining = $timeout - $GLOBALS['RUNTIMER']->getTime();
    if ($remaining >= $secs) {
        return;
    }
    @set_time_limit(max($timeout, (int)($secs + $remaining)));
}
/**
 * Print a "Traceback:" heading followed by the current call stack.
 *
 * @param mixed $bt Not used; the stack is taken from debug_print_backtrace().
 */
function printSimpleTrace($bt)
{
    print "\nTraceback:\n";
    debug_print_backtrace();
}
/**
 * Return the used process memory, in bytes.
 *
 * @return int Value reported by memory_get_usage().
 */
function getMemoryUsage()
{
    $bytes = memory_get_usage();
    return $bytes;
}
/**
 * Binary search in a sorted array.
 * Based on code from dennis.decoene@moveit.be, http://www.php.net/array_search
 *
 * @param mixed $needle   Value to search for.
 * @param array $haystack Sorted, one-dimensional array with keys 0..n-1
 *                        (no hash).
 * @return int|bool Index at which $needle was found, or false.
 */
function binary_search($needle, $haystack)
{
    $low = 0;
    $high = count($haystack) - 1;

    // Closed interval [$low, $high]; every position, including the first
    // and the last, can be probed.
    while ($low <= $high) {
        // Integer midpoint, so the index (and the result) is never a float.
        $probe = (int)(($low + $high) / 2);
        if ($haystack[$probe] == $needle) {
            return $probe;
        }
        if ($haystack[$probe] < $needle) {
            $low = $probe + 1;
        } else {
            $high = $probe - 1;
        }
    }
    return false;
}
/**
 * Test whether the server address is a loopback address.
 *
 * @return bool False as well when SERVER_ADDR is not available (e.g. CLI).
 */
function is_localhost()
{
    if (!isset($_SERVER['SERVER_ADDR'])) {
        return false;
    }
    // IPv4 and IPv6 loopback.
    return in_array($_SERVER['SERVER_ADDR'], array('127.0.0.1', '::1'), true);
}
/**
 * Take a string and quote it sufficiently to be passed as a Javascript
 * string between ''s
 *
 * Backslashes, single quotes and line breaks are escaped. Escaping the
 * quote alone would let a backslash in the input neutralise the escape,
 * and a raw line break would end the literal.
 *
 * @param string $s
 * @return string
 */
function javascript_quote_string($s)
{
    // strtr() with an array never rescans its own output, so the
    // backslashes added for the quote are not escaped a second time.
    return strtr($s, array(
        "\\" => "\\\\",
        "'"  => "\\'",
        "\n" => "\\n",
        "\r" => "\\r",
    ));
}
/**
 * Cheap test whether a string looks like serialize() output: longer than
 * three characters with ':' as its second character.
 *
 * @param string $s
 * @return bool
 */
function isSerialized($s)
{
    if (empty($s)) {
        return false;
    }
    if (strlen($s) <= 3) {
        return false;
    }
    return substr($s, 1, 1) == ':';
}
/**
 * Determine if a variable represents a whole number
 *
 * @param mixed $var
 * @return bool True for numeric values whose integer and float
 *              interpretations agree.
 */
function is_whole_number($var)
{
    if (!is_numeric($var)) {
        return false;
    }
    return intval($var) == floatval($var);
}
/**
 * Take a string and return an array of pairs (attribute name, attribute value)
 *
 * We allow attributes with or without double quotes (")
 * Attribute-value pairs may be separated by space or comma
 * Space is normal HTML attributes, comma is for RichTable compatibility
 * border=1, cellpadding="5"
 * border=1 cellpadding="5"
 * style="font-family: sans-serif; border-top:1px solid #dddddd;"
 * style="font-family: Verdana, Arial, Helvetica, sans-serif"
 *
 * Attribute names are lower-cased. When a name occurs more than once, the
 * first value wins. The value "0" is a regular value (border=0).
 *
 * @param string $line Attribute string.
 * @return array Attribute name => value.
 */
function parse_attributes($line)
{
    $options = array();
    if (!is_scalar($line) || $line === false) {
        return $options;
    }
    $line = (string)$line;

    while (true) {
        $line = trim($line);
        $line = trim($line, ",");
        // Compare with '' rather than using empty(): "0" is valid content.
        if ($line === '') {
            break;
        }

        // First we have an attribute name.
        $i = 0;
        $length = strlen($line);
        while (($i < $length) && ($line[$i] != '=')) {
            $i++;
        }
        $attribute = strtolower(substr($line, 0, $i));

        $line = (string)substr($line, $i + 1);
        $line = trim($line);
        $line = trim($line, "=");
        $line = trim($line);
        if ($line === '') {
            // Name without a value: nothing to record.
            break;
        }

        // Then we have the attribute value.
        $i = 0;
        $length = strlen($line);
        if ($line[0] == '"') {
            // Value between double quotes: find the closing double quote.
            $i++; // skip first '"'
            while (($i < $length) && ($line[$i] != '"')) {
                $i++;
            }
            $value = substr($line, 0, $i);
            $value = trim($value, '"');
            $value = trim($value);
        } else {
            // No double quotes: the value ends at the next space or comma.
            while (($i < $length) && ($line[$i] != ' ') && ($line[$i] != ',')) {
                $i++;
            }
            $value = substr($line, 0, $i);
            $value = trim($value);
            $value = trim($value, ",");
            $value = trim($value);
        }

        if (!array_key_exists($attribute, $options)) {
            $options[$attribute] = $value;
        }

        $line = (string)substr($line, $i + 1);
        $line = trim($line);
        $line = trim($line, ",");
    }

    return $options;
}
/**
 * Returns true if the filename ends with an image suffix.
 * Uses INLINE_IMAGES if defined, else "png|jpg|jpeg|gif|swf"
 *
 * @param string $filename
 * @return bool
 */
function is_image($filename)
{
    $inline_images = defined('INLINE_IMAGES')
        ? INLINE_IMAGES
        : "png|jpg|jpeg|gif|swf";

    $lowered = strtolower($filename);
    foreach (explode("|", $inline_images) as $suffix) {
        if (string_ends_with($lowered, "." . $suffix)) {
            return true;
        }
    }
    return false;
}
/**
 * Returns true if the filename ends with a video suffix.
 * Currently only FLV and OGG
 *
 * @param string $filename
 * @return bool
 */
function is_video($filename)
{
    $lowered = strtolower($filename);
    if (string_ends_with($lowered, ".flv")) {
        return true;
    }
    return string_ends_with($lowered, ".ogg");
}
/**
 * Remove accents from given text.
 *
 * Works directly on the UTF-8 text: the accented Latin letters listed
 * below are replaced by their base letters, every other character is left
 * untouched. (A round trip through ISO-8859-1 would turn characters
 * outside that charset into '?' and needs the deprecated
 * utf8_decode()/utf8_encode().)
 *
 * @param string $text UTF-8 text.
 * @return string
 */
function strip_accents($text)
{
    static $map = null;
    if ($map === null) {
        // Split the accented letters into single UTF-8 characters and pair
        // each with the ASCII letter at the same position.
        $accented = preg_split('//u',
            'àáâãäçèéêëìíîïñòóôõöùúûüýÿÀÁÂÃÄÇÈÉÊËÌÍÎÏÑÒÓÔÕÖÙÚÛÜÝ',
            -1, PREG_SPLIT_NO_EMPTY);
        $plain = str_split('aaaaaceeeeiiiinooooouuuuyyAAAAACEEEEIIIINOOOOOUUUUY');
        $map = array_combine($accented, $plain);
    }
    // The array form of strtr() replaces whole multi-byte sequences.
    return strtr($text, $map);
}
2226 // c-basic-offset: 4
2227 // c-hanging-comment-ender-p: nil
2228 // indent-tabs-mode: nil