Backport
[banana.git] / banana / message.func.inc.php
CommitLineData
7027794f 1<?php
2/********************************************************************************
3 * * banana/message.func.inc.php : function to display messages
4 * * ------------------------
5 * *
6 * * This file is part of the banana distribution
7 * * Copyright: See COPYING files that comes with this distribution
8 * ********************************************************************************/
9
10require_once dirname(__FILE__) . '/mimepart.inc.php';
11require_once dirname(__FILE__) . '/banana.inc.php';
12
13// {{{ Plain Text Functions
14
/**
 * Tell whether a line is "flowed", i.e. continues on the following line.
 *
 * A line is reported as flowed when its last character is whitespace, with
 * the exception of the signature separator "-- " which is never flowed.
 *
 * @param string $line Line to inspect, without its line terminator.
 * @return bool True when the line ends with whitespace and is not "-- ".
 */
function banana_isFlowed($line)
{
    // The signature separator ends with a space but must stay on its own line.
    if ($line == '-- ') {
        return false;
    }
    $last_char = substr($line, -1);
    return ctype_space($last_char);
}
19
/**
 * Strip the leading ">" quote markers from a line and report the quote depth.
 *
 * After the markers are removed, a single leading whitespace character (if
 * any) is dropped as well.
 *
 * @param string $line         Line to process.
 * @param int    &$quote_level Receives the number of ">" markers removed.
 * @param bool   $strict       When false, one whitespace character following
 *                             each ">" is also consumed, so "> > text" counts
 *                             as two levels; when true only adjacent ">" do.
 * @return string The line without its quote prefix.
 */
function banana_removeQuotes($line, &$quote_level, $strict = true)
{
    $quote_level = 0;
    // Compare against '' rather than using empty(): a line holding just "0"
    // is real content and must not be discarded.
    $line = (string) $line;
    while ($line !== '' && $line[0] === '>') {
        $line = (string) substr($line, 1);
        if (!$strict && $line !== '' && ctype_space($line[0])) {
            $line = (string) substr($line, 1);
        }
        $quote_level++;
    }
    // Drop the single separator/stuffing space that follows the quote prefix.
    if ($line !== '' && ctype_space($line[0])) {
        $line = (string) substr($line, 1);
    }
    return $line;
}
38
/**
 * Prefix every line of a text with a quote marker repeated $level times.
 *
 * @param string $line  Text to quote; may contain several "\n"-separated lines.
 * @param int    $level Number of times the marker is repeated on each line.
 * @param string $mark  Quote marker, ">" by default.
 * @return string The quoted text, with the same number of lines as the input.
 */
function banana_quote($line, $level, $mark = '>')
{
    $prefix = str_repeat($mark, $level);
    // Prefixing the first line and every line break covers all lines at once.
    return $prefix . str_replace("\n", "\n" . $prefix, $line);
}
48
/**
 * Join flowed lines back into full lines.
 *
 * Each line is stripped of its quote prefix; while the result is flowed (see
 * banana_isFlowed()) and the next line has the same quote level, the next
 * line is appended to it. Every resulting line is re-quoted at its level and
 * terminated by "\n".
 *
 * @param string $text Text whose lines are separated by "\n".
 * @return string The text with flowed lines merged.
 */
function banana_unflowed($text)
{
    $lines  = explode("\n", $text);
    $total  = count($lines);
    $output = '';
    $index  = 0;
    while ($index < $total) {
        $level   = 0;
        $current = banana_removeQuotes($lines[$index], $level);
        $index++;
        // Absorb following lines as long as the current one is flowed and the
        // quote depth does not change.
        while ($index < $total && banana_isFlowed($current)) {
            $next_level = 0;
            $next = banana_removeQuotes($lines[$index], $next_level);
            if ($next_level != $level) {
                break;
            }
            $current .= $next;
            $index++;
        }
        $output .= banana_quote($current, $level) . "\n";
    }
    return $output;
}
74
/**
 * Word-wrap a text to the configured display width, honouring a quote level.
 *
 * For a positive quote level the wrap width is reduced by the level plus one
 * and the wrapped text is quoted again at that level.
 *
 * @param string $text        Text to wrap (without quote markers).
 * @param int    $quote_level Quote depth to apply to the wrapped text.
 * @return string The wrapped (and possibly quoted) text.
 */
function banana_wordwrap($text, $quote_level)
{
    if ($quote_level <= 0) {
        return wordwrap($text, Banana::$msgshow_wrap);
    }
    $width   = Banana::$msgshow_wrap - $quote_level - 1;
    $wrapped = wordwrap($text, $width);
    return banana_quote($wrapped, $quote_level);
}
84
/**
 * Turn /emphasis/, _underline_ and *strong* plain-text markers into HTML tags.
 *
 * Anything matching the Banana::$msgshow_url pattern is masked with a
 * placeholder first, so the markers inside URLs are left alone, and restored
 * afterwards in order of appearance.
 *
 * @param string $text Text to format.
 * @return string The text with formatting markers replaced by tags.
 */
function banana_catchFormats($text)
{
    $formatting = array('/' => 'em', // match / first in order not to match closing markups </...> <> </>
                        '_' => 'u',
                        '*' => 'strong');
    $url = Banana::$msgshow_url;

    // Mask each URL where it occurs. Masking via str_replace() on the list of
    // matches breaks when one URL is a prefix of another.
    $protected = array();
    $masked = preg_replace_callback("/$url/ui", function ($match) use (&$protected) {
        $protected[] = $match[0];
        return '&&&urls&&&';
    }, $text);
    if ($masked === null) {
        // PCRE failure (e.g. invalid UTF-8): continue without URL protection.
        $protected = array();
        $masked = $text;
    }

    foreach ($formatting as $limit => $mark) {
        $limit = preg_quote($limit, '/');
        $formatted = preg_replace('/' . $limit . '(\S+?)' . $limit . '/us',
                                  "<$mark>\\1</$mark>", $masked);
        // Keep the previous text rather than null when the regex engine fails.
        if ($formatted !== null) {
            $masked = $formatted;
        }
    }

    // Restore the URLs; a callback replaces the removed /e modifier.
    $restored = preg_replace_callback('/&&&urls&&&/', function ($match) use (&$protected) {
        return (string) array_shift($protected);
    }, $masked);
    return $restored === null ? $masked : $restored;
}
100
101// {{{ URL Catcher tools
102
/**
 * Shorten a link for display so it does not exceed Banana::$msgshow_wrap.
 *
 * The link is entity-decoded, truncated with a trailing "..." when too long,
 * and entity-encoded again.
 *
 * @param string $link Entity-encoded link text.
 * @return string Entity-encoded, possibly truncated link text.
 */
function banana__cutlink($link)
{
    $link = banana_html_entity_decode($link, ENT_QUOTES);
    $max  = Banana::$msgshow_wrap;
    if (function_exists('mb_strlen')) {
        // Count and cut by character: cutting a UTF-8 sequence in the middle
        // makes htmlentities(..., 'UTF-8') return an empty string.
        if (mb_strlen($link, 'UTF-8') > $max) {
            $link = mb_substr($link, 0, $max - 3, 'UTF-8') . "...";
        }
    } elseif (strlen($link) > $max) {
        // mbstring is unavailable: fall back to the byte-wise behaviour.
        $link = substr($link, 0, $max - 3) . "...";
    }
    return banana_htmlentities($link, ENT_QUOTES);
}
111
/**
 * Build an HTML anchor for a URL found in a message.
 *
 * "@" is percent-encoded and "http://" is prepended when the URL carries no
 * "://" scheme separator. The visible label is shortened by banana__cutlink().
 *
 * @param string $url URL text as found in the message.
 * @return string The "<a>" element linking to the URL.
 */
function banana__cleanURL($url)
{
    $href = str_replace('@', '%40', $url);
    $has_scheme = strpos($href, '://') !== false;
    if (!$has_scheme) {
        $href = 'http://' . $href;
    }
    $label = banana__cutlink($href);
    return '<a href="' . $href . '" title="' . $href . '">' . $label . '</a>';
}
120
/**
 * Turn an address-like token into a link.
 *
 * When "<token>" is a key of Banana::$spool->ids, a link to that article is
 * built with Banana::$page->makeLink(). Otherwise a token containing "$" is
 * returned untouched and anything else becomes a mailto: link.
 *
 * @param string $email Token of the form local@domain.
 * @return string HTML link, or the token itself.
 */
function banana__catchMailLink($email)
{
    $message_id = '<' . $email . '>';
    if (isset(Banana::$spool->ids[$message_id])) {
        $link_args = Array('group' => Banana::$group,
                           'artid' => Banana::$spool->ids[$message_id],
                           'text'  => $email);
        return Banana::$page->makeLink($link_args);
    }
    if (strpos($email, '$') === false) {
        return '<a href="mailto:' . $email . '">' . $email . '</a>';
    }
    return $email;
}
133
134// }}}
135
/**
 * Replace URLs and mail / message-id tokens in entity-encoded text by links.
 *
 * The &lt; &gt; &quot; entities are temporarily surrounded by spaces so that
 * they are not swallowed by the URL and address patterns, and restored at
 * the end.
 *
 * @param string $text Entity-encoded text.
 * @return string The text with links inserted.
 */
function banana_catchURLs($text)
{
    $url = Banana::$msgshow_url;

    $res = preg_replace("/&(lt|gt|quot);/", " &\\1; ", $text);

    // Callbacks replace the /e modifier, which was removed in PHP 7.
    $res = preg_replace_callback("/$url/ui", function ($m) {
        // Trailing groups are absent from $m when they did not take part in
        // the match.
        $before = isset($m[1]) ? $m[1] : '';
        $link   = isset($m[2]) ? $m[2] : '';
        $after  = isset($m[3]) ? $m[3] : '';
        return $before . banana__cleanURL($link) . $after;
    }, $res);

    $res = preg_replace_callback(
        '/(["\[])?(?:mailto:|news:)?([a-z0-9.\-+_\$]+@([\-.+_]?[a-z0-9])+)(["\]])?/i',
        function ($m) {
            $after = isset($m[4]) ? $m[4] : '';
            return $m[1] . banana__catchMailLink($m[2]) . $after;
        },
        $res
    );

    $res = preg_replace("/ &(lt|gt|quot); /", "&\\1;", $res);
    return $res;
}
148
149// {{{ Quotes catcher functions
150
/**
 * Remove one quote marker from the beginning of every line of a text.
 *
 * A marker is removed where it follows the start of the text, a "<pre>" tag
 * or a newline. stripslashes() is then applied to the result.
 *
 * @param string $text   Quoted text.
 * @param string $regexp Regular-expression fragment matching one quote marker.
 * @return string The text with one level of quoting removed.
 */
function banana__replaceQuotes($text, $regexp)
{
    $pattern  = "@(^|<pre>|\n)" . $regexp . '@i';
    $unquoted = preg_replace($pattern, '\1', $text);
    return stripslashes($unquoted);
}
155
156// }}}
157
/**
 * Wrap quoted lines ("&gt;"-prefixed) of entity-encoded text in blockquotes.
 *
 * Each run of consecutive quoted lines loses one quote marker per line and is
 * enclosed in "</pre><blockquote><pre>" ... "</pre></blockquote><pre>". The
 * process repeats until no quoted line is left, which nests the blockquotes
 * for multi-level quotes.
 *
 * @param string $res    Entity-encoded text.
 * @param bool   $strict When false, spaces following a marker are part of it.
 * @return string The text with quotes converted to blockquotes.
 */
function banana_catchQuotes($res, $strict = true)
{
    $regexp = $strict ? "&gt;" : "&gt; *";
    $marker = "/(^|<pre>|\n)$regexp/i";
    $block  = "/(^|<pre>|\n)(($regexp.*(?:\n|$))+)/i";

    // The marker removal is done in the callback (instead of /e plus a
    // stripslashes() round trip) so backslashes in quoted text survive.
    $wrap = function ($m) use ($marker) {
        $inner = preg_replace($marker, '\1', $m[2]);
        return $m[1] . '</pre><blockquote><pre>' . $inner . '</pre></blockquote><pre>';
    };

    while (preg_match($marker, $res)) {
        $next = preg_replace_callback($block, $wrap, $res);
        // Stop on a PCRE failure or when nothing changed, to avoid looping
        // forever.
        if ($next === null || $next === $res) {
            break;
        }
        $res = $next;
    }
    return $res;
}
174
/**
 * Replace signature separator lines ("-- ") by a horizontal rule.
 *
 * A separator directly following a "<pre>" tag is first moved onto its own
 * line so that it is caught like the others.
 *
 * @param string $res Text whose lines are separated by "\n".
 * @return string The text with each separator line replaced by an "<hr>".
 */
function banana_catchSignature($res)
{
    $rule = '</pre><hr style="width: 100%; margin: 1em 0em; " /><pre>';
    $normalized = preg_replace("@<pre>-- ?\n@", "<pre>\n-- \n", $res);
    $chunks = preg_split("/\n-- ?\n/", $normalized);
    return implode($rule, $chunks);
}
182
/**
 * Convert a plain-text message body to HTML.
 *
 * The text is entity-encoded, then formatting markers, URLs, quotes and the
 * signature separator are converted in that order; the result is wrapped in
 * "<pre>" and passed through banana_cleanHtml().
 *
 * @param string $text   Plain-text body.
 * @param bool   $strict Passed to banana_catchQuotes().
 * @return string HTML rendering of the text.
 */
function banana_plainTextToHtml($text, $strict = true)
{
    $html = banana_catchFormats(banana_htmlentities($text));
    $html = banana_catchQuotes(banana_catchURLs($html), $strict);
    $html = banana_catchSignature($html);
    return banana_cleanHtml('<pre>' . $html . '</pre>');
}
192
/**
 * Re-wrap a quoted text, keeping lines of different quote levels apart.
 *
 * Consecutive lines sharing the same quote level are gathered, wrapped
 * together with banana_wordwrap() and re-quoted at their level plus
 * $base_level.
 *
 * @param string $text       Text whose lines are separated by "\n".
 * @param int    $base_level Extra quote depth added to every line.
 * @param bool   $strict     Passed to banana_removeQuotes().
 * @return string The re-wrapped text.
 */
function banana_wrap($text, $base_level = 0, $strict = true)
{
    $wrapped   = '';
    $pending   = array();
    $cur_level = 0;
    foreach (explode("\n", $text) as $raw_line) {
        $line_level = 0;
        $content = banana_removeQuotes($raw_line, $line_level, $strict);
        if ($line_level != $cur_level) {
            // The quote depth changed: flush the lines gathered so far.
            if (!empty($pending)) {
                $wrapped .= banana_wordwrap(implode("\n", $pending), $cur_level + $base_level) . "\n";
                $pending = array();
            }
            $cur_level = $line_level;
        }
        $pending[] = $content;
    }
    if (!empty($pending)) {
        $wrapped .= banana_wordwrap(implode("\n", $pending), $cur_level + $base_level);
    }
    return $wrapped;
}
216
/**
 * Render a plain-text MIME part as HTML.
 *
 * Flowed parts are unflowed first; the text is then re-wrapped and converted
 * to HTML, with the part's flowed flag used as the "strict" quoting mode.
 *
 * @param BananaMimePart $part       Part to render.
 * @param int            $base_level Extra quote depth applied when wrapping.
 * @return string HTML rendering of the part.
 */
function banana_formatPlainText(BananaMimePart &$part, $base_level = 0)
{
    $body = $part->getText();
    $body = $part->isFlowed() ? banana_unflowed($body) : $body;
    $wrapped = banana_wrap($body, $base_level, $part->isFlowed());
    return banana_plainTextToHtml($wrapped, $part->isFlowed());
}
226
/**
 * Produce the quoted version of a plain-text MIME part.
 *
 * Flowed parts are unflowed first; the text is then re-wrapped with one
 * extra quote level.
 *
 * @param BananaMimePart $part Part to quote.
 * @return string The quoted text.
 */
function banana_quotePlainText(BananaMimePart &$part)
{
    $body = $part->getText();
    $body = $part->isFlowed() ? banana_unflowed($body) : $body;
    return banana_wrap($body, 1);
}
235
236// }}}
237// {{{ HTML Functions
238
/**
 * htmlentities() wrapper that always works in UTF-8.
 *
 * @param string $text  Text to encode.
 * @param int    $quote Quote-handling flag passed to htmlentities().
 * @return string The entity-encoded text.
 */
function banana_htmlentities($text, $quote = ENT_COMPAT)
{
    $charset = 'UTF-8';
    $encoded = htmlentities($text, $quote, $charset);
    return $encoded;
}
243
/**
 * html_entity_decode() wrapper that always works in UTF-8.
 *
 * @param string $text  Text to decode.
 * @param int    $quote Quote-handling flag passed to html_entity_decode().
 * @return string The decoded text.
 */
function banana_html_entity_decode($text, $quote = ENT_COMPAT)
{
    $charset = 'UTF-8';
    $decoded = html_entity_decode($text, $quote, $charset);
    return $decoded;
}
248
/**
 * Remove scripting-related keywords from the source of an HTML tag.
 *
 * Every occurrence (case-insensitive) of "javascript:" and of the listed
 * event-handler names is deleted, then stripslashes() is applied.
 * NOTE(review): the list is a fixed blacklist; handlers not named here
 * (onload, onerror, ...) are left in place.
 *
 * @param string $tagSource Content of a tag, without the angle brackets.
 * @return string The filtered tag content.
 */
function banana_removeEvilAttributes($tagSource)
{
    $forbidden = array(
        'javascript:', 'onclick', 'ondblclick', 'onmousedown', 'onmouseup', 'onmouseover',
        'onmousemove', 'onmouseout', 'onkeypress', 'onkeydown', 'onkeyup',
    );
    $pattern = '/' . implode('|', $forbidden) . '/i';
    $filtered = preg_replace($pattern, '', $tagSource);
    return stripslashes($filtered);
}
255
/**
 * Convert presentational HTML attributes of a tag into an inline style.
 *
 * Known attributes (width, size, bgcolor, ...) are removed from the attribute
 * string and translated to CSS declarations gathered in a style="" attribute.
 * The function keeps static state across calls: a table's cellpadding is
 * remembered and applied to the "td" tags seen until the matching "/table".
 *
 * @param string $tag        Tag name, prefixed with "/" for a closing tag.
 * @param string $attributes Raw attribute string of the tag.
 * @return string Attribute string to emit after the tag name; '' for closing tags.
 */
function banana_cleanStyles($tag, $attributes)
{
    static $td_style, $conv, $size_conv;
    if (!isset($td_style)) {
        // HTML attribute => CSS property. "border-width" and "font-family"
        // are the CSS properties matching border="" and face="".
        $conv = array('style' => 'style', 'width' => 'width', 'height' => 'height', 'border' => 'border-width',
                      'size' => 'font-size', 'align' => 'text-align', 'valign' => 'vertical-align',
                      'face' => 'font-family', 'bgcolor' => 'background-color', 'color' => 'color',
                      'cellpadding' => 'padding', 'cellspacing' => 'border-spacing');
        $size_conv = array(1 => 'xx-small', 2 => 'x-small', 3 => 'small', 4 => 'medium', 5 => 'large',
                           6 => 'x-large', 7 => 'xx-large',
                           '-2' => 'xx-small', '-1' => 'x-small', '+1' => 'medium', '+2' => 'large',
                           '+3' => 'x-large', '+4' => 'xx-large');
        $td_style = array();
    }

    // Tag names are case-insensitive in HTML.
    $tag = strtolower((string) $tag);
    if ($tag == 'table') {
        array_unshift($td_style, '');
    }
    if ($tag == '/table') {
        array_shift($td_style);
    }
    if ($tag !== '' && $tag[0] === '/') {
        return '';
    }
    // A "td" met outside any table has no inherited style.
    if ($tag == 'td' && isset($td_style[0])) {
        $style = $td_style[0];
    } else {
        $style = '';
    }

    // stripslashes() is kept because the caller in this file may hand over a
    // backslash-escaped string.
    $attributes = str_replace("\n", ' ', stripslashes($attributes));
    $attributes = str_replace('= "', '="', $attributes);
    foreach ($conv as $att => $stl) {
        $pattern = '/\b' . preg_quote($att, '/') . '="(.+?)"/i';
        if (!preg_match($pattern, $attributes, $matches)) {
            continue;
        }
        $attributes = preg_replace($pattern, '', $attributes);
        $val = $matches[1];
        if ($att == 'cellspacing' && strpos($style, 'border-collapse') === false) {
            $style .= "border-collapse: separate; border-spacing: $val $val; ";
        } elseif ($att == 'cellpadding' && $tag == 'table') {
            // Not applied to the table itself: stored for its cells.
            $td_style[0] = "$stl: {$val}px; ";
        } elseif ($att == 'style') {
            $val = rtrim($val, ' ;');
            $style .= "$val; ";
        } elseif ($att == 'size') {
            // Unknown sizes are dropped instead of emitting an empty value.
            if (isset($size_conv[$val])) {
                $style .= "$stl: {$size_conv[$val]}; ";
            }
        } elseif (is_numeric($val)) {
            $style .= "$stl: {$val}px; ";
        } else {
            $style .= "$stl: $val; ";
        }
    }
    if (!empty($style)) {
        $style = 'style="' . $style . '" ';
    }
    return ' ' . $style . trim($attributes);
}
e67c2c1c 313
/**
 * Scope a message's CSS to the message body and neutralise external images.
 *
 * Selectors are prefixed with ".banana .message .body .html" and " body"
 * selectors are removed. Unless Banana::$msgshow_externalimages is set,
 * http/https/ftp url() references are replaced by a placeholder and
 * Banana::$msgshow_hasextimages is raised.
 *
 * @param string $css Stylesheet text.
 * @return string The filtered stylesheet.
 */
function banana_filterCss($css)
{
    $scoped = preg_replace("/(^|\n|,)\s*(\w+[^\{\}\<]+\{)/s", '\1.banana .message .body .html \2', $css);
    $scoped = preg_replace('/ body\b/i', '', $scoped);
    if (Banana::$msgshow_externalimages) {
        return $scoped;
    }
    $external_url = "/url\(((ht|f)tps?:.*?)\)/i";
    if (preg_match($external_url, $scoped)) {
        $scoped = preg_replace($external_url, 'url(invalid-image.png)', $scoped);
        Banana::$msgshow_hasextimages = true;
    }
    return $scoped;
}
7027794f 326
/**
 * Strip forbidden tags and delegate the tag-source check to
 * banana_removeEvilAttributes().
 *
 * When the tidy extension is available the markup is repaired first. With
 * $to_xhtml set, the <head> is removed (its text/css <style> blocks are
 * filtered and registered through Banana::$page->addCssInline()), deprecated
 * tags are turned into <span>/<div>, and presentational attributes are
 * converted to inline styles by banana_cleanStyles().
 *
 * @param string $source   HTML to clean.
 * @param bool   $to_xhtml Whether to apply the XHTML/CSS conversion.
 * @return string The cleaned HTML.
 */
function banana_cleanHtml($source, $to_xhtml = false)
{
    if (function_exists('tidy_repair_string')) {
        // The configuration is passed directly: tidy_setopt() and
        // tidy_set_encoding() only existed in Tidy 1.x.
        $tidy_config = array(
            'drop-empty-paras'            => true,
            'drop-proprietary-attributes' => true,
            'hide-comments'               => true,
            'logical-emphasis'            => true,
            'output-xhtml'                => true,
            'replace-color'               => true,
            'join-classes'                => false,
            'clean'                       => false, // 'clean' may be a good idea, but it is too aggressive
            'show-body-only'              => false,
            'alt-text'                    => '[ inserted by TIDY ]',
            'wrap'                        => 120,
        );
        $repaired = tidy_repair_string($source, $tidy_config, 'utf8');
        if (is_string($repaired)) {
            $source = $repaired;
        }
    }

    // To XHTML
    $css = null;
    if ($to_xhtml) {
        // catch inline CSS
        if (preg_match('/<head\b.*?>(.*?)<\/head>/is', $source, $head)) {
            $source = preg_replace('/<head\b.*?>.*?<\/head>/is', '', $source);
            preg_match_all('/<style.*?type="text\/css".*?>(.*?)<\/style>/is', $head[1], $styles);
            $css = banana_filterCss(implode('', $styles[1]));
            Banana::$page->addCssInline($css);
        }

        // clean DTD
        $source = str_replace('<font', '<span', $source);
        $source = preg_replace('/<u\b/', '<span style="text-decoration: underline"', $source);
        $source = preg_replace('/<\/(font|u)>/', '</span>', $source);
        $source = str_replace('<body', $css ? '<div class="html"' : '<div class="html default"', $source);
        $source = str_replace('</body>', '</div>', $source);
    }
    $allowedTags = '<h1><h2><h3><b><i><a><ul><li><pre><hr><blockquote><img><br><div><span>'
                 . '<p><small><big><sup><sub><code><em><strong><table><tr><td><th>';
    $source = strip_tags($source, $allowedTags);

    // Use inlined style instead of old html attributes.
    // Callbacks replace the /e modifier, which was removed in PHP 7.
    if ($to_xhtml) {
        $source = preg_replace_callback('/<(\/?\w+)(.*?)(\/?>)/is', function ($m) {
            return '<' . $m[1] . banana_cleanStyles($m[1], $m[2]) . $m[3];
        }, $source);
    }
    // /s lets the filter see tags that span several lines as well.
    return preg_replace_callback('/<(.*?)>/is', function ($m) {
        return '<' . banana_removeEvilAttributes($m[1]) . '>';
    }, $source);
}
385
/**
 * Replace the signature separator ("-- ") of an HTML body by a horizontal rule.
 *
 * The various markups surrounding the separator are first normalised to
 * "<br/>-- <br/>" (or a paragraph containing only the separator); the text is
 * then split on those and joined with an "<hr>".
 *
 * @param string $res HTML body.
 * @return string The HTML with separators replaced by "<hr>" elements.
 */
function banana_catchHtmlSignature($res)
{
    $res = preg_replace("@(</p>)\n?-- ?\n?(<p[^>]*>|<br[^>]*>)@", "\\1<br/>-- \\2", $res);
    // The pattern has a single group: \\1 keeps the <p> that follows the separator.
    $res = preg_replace("@<br[^>]*>\n?-- ?\n?(<p[^>]*>)@", "<br/>-- <br/>\\1", $res);
    $res = preg_replace("@(<pre[^>]*>)\n?-- ?\n@", "<br/>-- <br/>\\1", $res);
    // (?: ... ) is a non-capturing group; "(:?" would instead accept a stray colon.
    $parts = preg_split("@(?:<p[^>]*>\n?-- ?\n?</p>|<br[^>]*>\n?-- ?\n?<br[^>]*>)@", $res);
    $sign  = '<hr style="width: 100%; margin: 1em 0em; " />';
    return join($sign, $parts);
}
395
396// {{{ Link to part catcher tools
397
/**
 * Build the entity-encoded URL of a part of the current article.
 *
 * @param string $cid Identifier of the part, passed as the 'part' URL argument.
 * @return string Entity-encoded URL built by Banana::$page->makeUrl().
 */
function banana__linkAttachment($cid)
{
    $url_args = Array('group' => Banana::$group,
                      'artid' => Banana::$artid,
                      'part'  => $cid);
    $url = Banana::$page->makeUrl($url_args);
    return banana_htmlentities($url);
}
405
406// }}}
407
/**
 * Neutralise <img> tags whose source does not start with "cid".
 *
 * When at least one such image is found, Banana::$msgshow_hasextimages is set
 * and the src of each of them is replaced by "invalid".
 *
 * @param string $text HTML text.
 * @return string The HTML with external image sources replaced.
 */
function banana_hideExternalImages($text)
{
    $external_img = "/<img([^>]*?)src=['\"](?!cid).*?['\"](.*?)>/i";
    if (!preg_match($external_img, $text)) {
        return $text;
    }
    Banana::$msgshow_hasextimages = true;
    return preg_replace($external_img, '<img\1src="invalid"\2>', $text);
}
418
/**
 * Rewrite intra-message references of an HTML body.
 *
 * "cid:xxx" references are replaced by the URL of the matching part, and
 * fragment-only links (href="#...") are prefixed with the URL of the
 * current article part.
 *
 * @param string $text HTML body.
 * @return string The HTML with references rewritten.
 */
function banana_catchPartLinks($text)
{
    $article = Banana::$page->makeURL(array('group' => Banana::$group,
                                            'artid' => Banana::$artid,
                                            'part'  => Banana::$part));
    $article = banana_htmlentities($article);

    // Callbacks replace the /e modifier, which was removed in PHP 7.
    $text = preg_replace_callback('/cid:([^\'" ]+)/', function ($m) {
        return banana__linkAttachment($m[1]);
    }, $text);
    // A callback also keeps "$1"- or "\1"-like sequences of the URL from
    // being read as back-references.
    $text = preg_replace_callback('/href="(#.*?)"/i', function ($m) use ($article) {
        return 'href="' . $article . $m[1] . '"';
    }, $text);
    return $text;
}
427
428// {{{ HTML to Plain Text tools
429
/**
 * Replace HTML emphasis tags by their plain-text markers.
 *
 * Opening and closing em/i tags become "/", strong/b become "*" and u
 * becomes "_".
 *
 * @param string $res HTML text.
 * @return string The text with the formatting tags replaced by markers.
 */
function banana__convertFormats($res)
{
    // Patterns are applied in order, each with the marker at the same index.
    $patterns = array(
        "!</?(em|i)( .*?)?>!is",
        "!</?(strong|b)( .*?)?>!is",
        "!</?(u)( .*?)?>!is",
    );
    $markers = array('/', '*', '_');
    return preg_replace($patterns, $markers, $res);
}
440
/**
 * Convert <blockquote> elements into "&gt;"-quoted plain text.
 *
 * Each blockquote holding no further tag is replaced by a newline followed by
 * its content (plus a trailing newline) quoted one level with "&gt;". The
 * conversion is repeated so nested blockquotes are handled from the inside
 * out, each enclosing level adding one marker.
 *
 * @param string $res Text in which blockquote is the only remaining tag.
 * @return string The text with blockquotes converted to quoted lines.
 */
function banana__convertQuotes($res)
{
    // A callback replaces the /e modifier, which was removed in PHP 7.
    $quote_block = function ($m) {
        return "\n" . banana_quote($m[1] . "\n", 1, '&gt;');
    };
    do {
        // [^>]* keeps the opening tag from stretching over the text that
        // precedes a nested blockquote.
        $converted = preg_replace_callback('!<blockquote[^>]*>([^<]*)</blockquote>!i',
                                           $quote_block, $res, -1, $count);
        if ($converted === null) {
            break;
        }
        $res = $converted;
    } while ($count > 0);
    return $res;
}
447
448// }}}
449
/**
 * Convert an HTML fragment to plain text.
 *
 * Newlines are dropped, emphasis tags become text markers, every tag except
 * div/br/p/blockquote is stripped, br/p/div become newlines, blockquotes
 * become quoted lines and entities are finally decoded.
 *
 * @param string $res HTML text.
 * @return string Plain-text rendering.
 */
function banana_htmlToPlainText($res)
{
    $flat = str_replace("\n", '', $res);
    $flat = banana__convertFormats($flat);
    $flat = strip_tags($flat, '<div><br><p><blockquote>');
    $flat = preg_replace("@</?(br|p|div).*?>@si", "\n", trim($flat));
    return banana_html_entity_decode(banana__convertQuotes($flat));
}
459
/**
 * Render an HTML MIME part for display.
 *
 * The signature separator is converted, external images are hidden unless
 * Banana::$msgshow_externalimages is set, part links are rewritten and the
 * result is cleaned with the XHTML conversion enabled.
 *
 * @param BananaMimePart $part Part to render.
 * @return string Cleaned HTML.
 */
function banana_formatHtml(BananaMimePart &$part)
{
    $html = banana_catchHtmlSignature($part->getText());
    if (!Banana::$msgshow_externalimages) {
        $html = banana_hideExternalImages($html);
    }
    $html = banana_catchPartLinks($html);
    return banana_cleanHtml($html, true);
}
470
/**
 * Produce the quoted plain-text version of an HTML MIME part.
 *
 * @param BananaMimePart $part Part to quote.
 * @return string Plain text of the part, re-wrapped with one quote level.
 */
function banana_quoteHtml(BananaMimePart &$part)
{
    $plain = banana_htmlToPlainText($part->getText());
    return banana_wrap($plain, 1);
}
477
478// }}}
479// {{{ Richtext Functions
480
/**
 * Convert richtext to html.
 *
 * Unsupported tags are stripped, richtext tags are renamed to their HTML
 * counterparts, <signature>, <lt> and <comment> get dedicated handling and
 * the result is passed through banana_cleanHtml().
 *
 * @param string $source Richtext source.
 * @return string Cleaned HTML.
 */
function banana_richtextToHtml($source)
{
    // richtext tag => html tag
    $tags = Array('bold'        => 'b',
                  'italic'      => 'i',
                  'smaller'     => 'small',
                  'bigger'      => 'big',
                  'underline'   => 'u',
                  'subscript'   => 'sub',
                  'superscript' => 'sup',
                  'excerpt'     => 'blockquote',
                  'paragraph'   => 'p',
                  'nl'          => 'br'
            );

    // clean unsupported tags
    $protectedTags = '<signature><lt><comment><' . join('><', array_keys($tags)) . '>';
    $html = strip_tags($source, $protectedTags);

    // convert richtext tags to html
    foreach ($tags as $rich_tag => $html_tag) {
        $html = preg_replace('@(</?)' . $rich_tag . '([^>]*>)@i', '\1' . $html_tag . '\2', $html);
    }

    // some special cases
    $html = preg_replace('@<signature>@i', '<br>-- <br>', $html);
    $html = preg_replace('@</signature>@i', '', $html);
    $html = preg_replace('@<lt>@i', '&lt;', $html);
    $html = preg_replace('@<comment[^>]*>((?:[^<]|<(?!/comment>))*)</comment>@i', '<!-- \1 -->', $html);
    return banana_cleanHtml($html);
}
513
/**
 * Render a richtext MIME part for display.
 *
 * The part is converted to HTML, its signature separator is replaced and the
 * result is cleaned.
 *
 * @param BananaMimePart $part Part to render.
 * @return string Cleaned HTML.
 */
function banana_formatRichText(BananaMimePart &$part)
{
    $html = banana_richtextToHtml($part->getText());
    $html = banana_catchHtmlSignature($html);
    return banana_cleanHtml($html);
}
521
/**
 * Produce the quoted plain-text version of a richtext MIME part.
 *
 * @param BananaMimePart $part Part to quote.
 * @return string Plain text of the part, re-wrapped with one quote level.
 */
function banana_quoteRichtText(BananaMimePart &$part)
{
    $html  = banana_richtextToHtml($part->getText());
    $plain = banana_htmlToPlainText($html);
    return banana_wrap($plain, 1);
}
529
7027794f 530// }}}
531
598a1c53 532// vim:set et sw=4 sts=4 ts=4 enc=utf-8:
7027794f 533?>