blob: 20bf32335b65d55fd16b6e885991269c3c379d8b [file] [log] [blame]
Derek Allard3d879d52008-01-18 19:41:32 +00001<?php if (!defined('BASEPATH')) exit('No direct script access allowed');
2/**
3 * CodeIgniter
4 *
5 * An open source application development framework for PHP 4.3.2 or newer
6 *
7 * @package CodeIgniter
8 * @author ExpressionEngine Dev Team
9 * @copyright Copyright (c) 2006, EllisLab, Inc.
Derek Jones7a9193a2008-01-21 18:39:20 +000010 * @license http://codeigniter.com/user_guide/license.html
11 * @link http://codeigniter.com
Derek Allard3d879d52008-01-18 19:41:32 +000012 * @since Version 1.0
13 * @filesource
14 */
15
16// ------------------------------------------------------------------------
17
18/**
19 * CodeIgniter Text Helpers
20 *
21 * @package CodeIgniter
22 * @subpackage Helpers
23 * @category Helpers
24 * @author ExpressionEngine Dev Team
Derek Jones7a9193a2008-01-21 18:39:20 +000025 * @link http://codeigniter.com/user_guide/helpers/text_helper.html
Derek Allard3d879d52008-01-18 19:41:32 +000026 */
27
28// ------------------------------------------------------------------------
29
30/**
31 * Word Limiter
32 *
33 * Limits a string to X number of words.
34 *
35 * @access public
36 * @param string
37 * @param integer
38 * @param string the end character. Usually an ellipsis
39 * @return string
40 */
41function word_limiter($str, $n = 100, $end_char = '&#8230;')
42{
43 if (strlen($str) < $n)
44 {
45 return $str;
46 }
47
48 $words = explode(' ', preg_replace("/\s+/", ' ', preg_replace("/(\r\n|\r|\n)/", " ", $str)));
49
50 if (count($words) <= $n)
51 {
52 return $str;
53 }
54
55 $str = '';
56 for ($i = 0; $i < $n; $i++)
57 {
58 $str .= $words[$i].' ';
59 }
60
61 return trim($str).$end_char;
62}
63
64// ------------------------------------------------------------------------
65
66/**
67 * Character Limiter
68 *
69 * Limits the string based on the character count. Preserves complete words
70 * so the character count may not be exactly as specified.
71 *
72 * @access public
73 * @param string
74 * @param integer
75 * @param string the end character. Usually an ellipsis
76 * @return string
77 */
78function character_limiter($str, $n = 500, $end_char = '&#8230;')
79{
80 if (strlen($str) < $n)
81 {
82 return $str;
83 }
84
85 $str = preg_replace("/\s+/", ' ', preg_replace("/(\r\n|\r|\n)/", " ", $str));
86
87 if (strlen($str) <= $n)
88 {
89 return $str;
90 }
91
92 $out = "";
93 foreach (explode(' ', trim($str)) as $val)
94 {
95 $out .= $val.' ';
96 if (strlen($out) >= $n)
97 {
98 return trim($out).$end_char;
99 }
100 }
101}
102
103// ------------------------------------------------------------------------
104
105/**
106 * High ASCII to Entities
107 *
108 * Converts High ascii text and MS Word special characters to character entities
109 *
110 * @access public
111 * @param string
112 * @return string
113 */
114function ascii_to_entities($str)
115{
116 $count = 1;
117 $out = '';
118 $temp = array();
119
120 for ($i = 0, $s = strlen($str); $i < $s; $i++)
121 {
122 $ordinal = ord($str[$i]);
123
124 if ($ordinal < 128)
125 {
126 $out .= $str[$i];
127 }
128 else
129 {
130 if (count($temp) == 0)
131 {
132 $count = ($ordinal < 224) ? 2 : 3;
133 }
134
135 $temp[] = $ordinal;
136
137 if (count($temp) == $count)
138 {
139 $number = ($count == 3) ? (($temp['0'] % 16) * 4096) + (($temp['1'] % 64) * 64) + ($temp['2'] % 64) : (($temp['0'] % 32) * 64) + ($temp['1'] % 64);
140
141 $out .= '&#'.$number.';';
142 $count = 1;
143 $temp = array();
144 }
145 }
146 }
147
148 return $out;
149}
150
151// ------------------------------------------------------------------------
152
153/**
154 * Entities to ASCII
155 *
156 * Converts character entities back to ASCII
157 *
158 * @access public
159 * @param string
160 * @param bool
161 * @return string
162 */
163function entities_to_ascii($str, $all = TRUE)
164{
165 if (preg_match_all('/\&#(\d+)\;/', $str, $matches))
166 {
167 for ($i = 0, $s = count($matches['0']); $i < $s; $i++)
168 {
169 $digits = $matches['1'][$i];
170
171 $out = '';
172
173 if ($digits < 128)
174 {
175 $out .= chr($digits);
176
177 }
178 elseif ($digits < 2048)
179 {
180 $out .= chr(192 + (($digits - ($digits % 64)) / 64));
181 $out .= chr(128 + ($digits % 64));
182 }
183 else
184 {
185 $out .= chr(224 + (($digits - ($digits % 4096)) / 4096));
186 $out .= chr(128 + ((($digits % 4096) - ($digits % 64)) / 64));
187 $out .= chr(128 + ($digits % 64));
188 }
189
190 $str = str_replace($matches['0'][$i], $out, $str);
191 }
192 }
193
194 if ($all)
195 {
196 $str = str_replace(array("&amp;", "&lt;", "&gt;", "&quot;", "&apos;", "&#45;"),
197 array("&","<",">","\"", "'", "-"),
198 $str);
199 }
200
201 return $str;
202}
203
204// ------------------------------------------------------------------------
205
206/**
207 * Word Censoring Function
208 *
209 * Supply a string and an array of disallowed words and any
210 * matched words will be converted to #### or to the replacement
211 * word you've submitted.
212 *
213 * @access public
214 * @param string the text string
215 * @param string the array of censoered words
216 * @param string the optional replacement value
217 * @return string
218 */
219function word_censor($str, $censored, $replacement = '')
220{
221 if ( ! is_array($censored))
222 {
223 return $str;
224 }
225
226 $str = ' '.$str.' ';
227 foreach ($censored as $badword)
228 {
229 if ($replacement != '')
230 {
231 $str = preg_replace("/\b(".str_replace('\*', '\w*?', preg_quote($badword)).")\b/i", $replacement, $str);
232 }
233 else
234 {
235 $str = preg_replace("/\b(".str_replace('\*', '\w*?', preg_quote($badword)).")\b/ie", "str_repeat('#', strlen('\\1'))", $str);
236 }
237 }
238
239 return trim($str);
240}
241
242// ------------------------------------------------------------------------
243
244/**
245 * Code Highlighter
246 *
247 * Colorizes code strings
248 *
249 * @access public
250 * @param string the text string
251 * @return string
252 */
253function highlight_code($str)
254{
255 // The highlight string function encodes and highlights
256 // brackets so we need them to start raw
257 $str = str_replace(array('&lt;', '&gt;'), array('<', '>'), $str);
258
259 // Replace any existing PHP tags to temporary markers so they don't accidentally
260 // break the string out of PHP, and thus, thwart the highlighting.
261
Derek Jones9468f3e2008-01-22 19:19:27 +0000262 $str = str_replace(array('<?', '?>', '<%', '%>', '\\', '</script>'),
263 array('phptagopen', 'phptagclose', 'asptagopen', 'asptagclose', 'backslashtmp', 'scriptclose'), $str);
264
Derek Allard3d879d52008-01-18 19:41:32 +0000265 // The highlight_string function requires that the text be surrounded
266 // by PHP tags. Since we don't know if A) the submitted text has PHP tags,
267 // or B) whether the PHP tags enclose the entire string, we will add our
268 // own PHP tags around the string along with some markers to make replacement easier later
269
Derek Jonese3525492008-01-22 19:51:03 +0000270 $str = '<?php tempstart'."\n".$str.'tempend ?>';
Derek Allard3d879d52008-01-18 19:41:32 +0000271
272 // All the magic happens here, baby!
273 $str = highlight_string($str, TRUE);
274
275 // Prior to PHP 5, the highlight function used icky font tags
276 // so we'll replace them with span tags.
277 if (abs(phpversion()) < 5)
278 {
279 $str = str_replace(array('<font ', '</font>'), array('<span ', '</span>'), $str);
280 $str = preg_replace('#color="(.*?)"#', 'style="color: \\1"', $str);
281 }
282
Derek Jones9cee7912008-01-22 20:12:47 +0000283 // Remove our artificially added PHP
284 $str = preg_replace("#\<code\>.+?tempstart\<br />(?:\</span\>)?#is", "<code>\n", $str);
Derek Jonese3525492008-01-22 19:51:03 +0000285 $str = preg_replace("#tempend.+#is", "</span>\n</code>", $str);
Derek Allard3d879d52008-01-18 19:41:32 +0000286
287 // Replace our markers back to PHP tags.
Derek Jones9468f3e2008-01-22 19:19:27 +0000288 $str = str_replace(array('phptagopen', 'phptagclose', 'asptagopen', 'asptagclose', 'backslashtmp', 'scriptclose'),
289 array('&lt;?', '?&gt;', '&lt;%', '%&gt;', '\\', '&lt;/script&gt;'), $str);
290
Derek Allard3d879d52008-01-18 19:41:32 +0000291 return $str;
292}
293
294// ------------------------------------------------------------------------
295
296/**
297 * Phrase Highlighter
298 *
299 * Highlights a phrase within a text string
300 *
301 * @access public
302 * @param string the text string
303 * @param string the phrase you'd like to highlight
304 * @param string the openging tag to precede the phrase with
305 * @param string the closing tag to end the phrase with
306 * @return string
307 */
308function highlight_phrase($str, $phrase, $tag_open = '<strong>', $tag_close = '</strong>')
309{
310 if ($str == '')
311 {
312 return '';
313 }
314
315 if ($phrase != '')
316 {
317 return preg_replace('/('.preg_quote($phrase, '/').')/i', $tag_open."\\1".$tag_close, $str);
318 }
319
320 return $str;
321}
322
323// ------------------------------------------------------------------------
324
325/**
326 * Word Wrap
327 *
328 * Wraps text at the specified character. Maintains the integrity of words.
329 * Anything placed between {unwrap}{/unwrap} will not be word wrapped, nor
330 * will URLs.
331 *
332 * @access public
333 * @param string the text string
334 * @param integer the number of characters to wrap at
335 * @return string
336 */
337function word_wrap($str, $charlim = '76')
338{
339 // Se the character limit
340 if ( ! is_numeric($charlim))
341 $charlim = 76;
342
343 // Reduce multiple spaces
344 $str = preg_replace("| +|", " ", $str);
345
346 // Standardize newlines
347 $str = preg_replace("/\r\n|\r/", "\n", $str);
348
349 // If the current word is surrounded by {unwrap} tags we'll
350 // strip the entire chunk and replace it with a marker.
351 $unwrap = array();
352 if (preg_match_all("|(\{unwrap\}.+?\{/unwrap\})|s", $str, $matches))
353 {
354 for ($i = 0; $i < count($matches['0']); $i++)
355 {
356 $unwrap[] = $matches['1'][$i];
357 $str = str_replace($matches['1'][$i], "{{unwrapped".$i."}}", $str);
358 }
359 }
360
361 // Use PHP's native function to do the initial wordwrap.
362 // We set the cut flag to FALSE so that any individual words that are
363 // too long get left alone. In the next step we'll deal with them.
364 $str = wordwrap($str, $charlim, "\n", FALSE);
365
366 // Split the string into individual lines of text and cycle through them
367 $output = "";
368 foreach (explode("\n", $str) as $line)
369 {
370 // Is the line within the allowed character count?
371 // If so we'll join it to the output and continue
372 if (strlen($line) <= $charlim)
373 {
374 $output .= $line."\n";
375 continue;
376 }
377
378 $temp = '';
379 while((strlen($line)) > $charlim)
380 {
381 // If the over-length word is a URL we won't wrap it
382 if (preg_match("!\[url.+\]|://|wwww.!", $line))
383 {
384 break;
385 }
386
387 // Trim the word down
388 $temp .= substr($line, 0, $charlim-1);
389 $line = substr($line, $charlim-1);
390 }
391
392 // If $temp contains data it means we had to split up an over-length
393 // word into smaller chunks so we'll add it back to our current line
394 if ($temp != '')
395 {
396 $output .= $temp . "\n" . $line;
397 }
398 else
399 {
400 $output .= $line;
401 }
402
403 $output .= "\n";
404 }
405
406 // Put our markers back
407 if (count($unwrap) > 0)
408 {
409 foreach ($unwrap as $key => $val)
410 {
411 $output = str_replace("{{unwrapped".$key."}}", $val, $output);
412 }
413 }
414
415 // Remove the unwrap tags
416 $output = str_replace(array('{unwrap}', '{/unwrap}'), '', $output);
417
418 return $output;
419}
420
421
422?>