1: <?php
2:
3: 4: 5: 6: 7: 8: 9: 10: 11:
12:
13:
14:
15: 16: 17: 18: 19:
/**
 * String tools library.
 *
 * Static class: every helper is a public static method and the constructor
 * always throws. Unless a method takes an explicit $encoding argument, the
 * multi-byte helpers operate on UTF-8.
 */
class NString
{

	/**
	 * Static class - cannot be instantiated.
	 *
	 * @throws LogicException always
	 */
	final public function __construct()
	{
		throw new LogicException("Cannot instantiate static class " . get_class($this));
	}



	/**
	 * Checks whether the string is valid in the given encoding.
	 *
	 * The string is considered valid when fixEncoding() returns it unchanged.
	 *
	 * @param  string  byte stream to check
	 * @param  string  expected encoding
	 * @return bool
	 */
	public static function checkEncoding($s, $encoding = 'UTF-8')
	{
		return $s === self::fixEncoding($s, $encoding);
	}



	/**
	 * Round-trips the string through UTF-16 with iconv's //IGNORE flag in
	 * both directions and returns the result.
	 *
	 * @param  string  byte stream to fix
	 * @param  string  encoding
	 * @return string
	 */
	public static function fixEncoding($s, $encoding = 'UTF-8')
	{
		// errors of the outer conversion are suppressed, as in the original code
		return @iconv('UTF-16', $encoding . '//IGNORE', iconv($encoding, 'UTF-16//IGNORE', $s));
	}



	/**
	 * Returns the character with the given code point.
	 *
	 * The code is packed as a 32-bit big-endian integer and converted from
	 * UTF-32BE to the requested encoding.
	 *
	 * @param  int     code point
	 * @param  string  target encoding
	 * @return string
	 */
	public static function chr($code, $encoding = 'UTF-8')
	{
		return iconv('UTF-32BE', $encoding . '//IGNORE', pack('N', $code));
	}



	/**
	 * Does $haystack start with $needle? (byte-wise comparison)
	 *
	 * @param  string
	 * @param  string
	 * @return bool
	 */
	public static function startsWith($haystack, $needle)
	{
		return strncmp($haystack, $needle, strlen($needle)) === 0;
	}



	/**
	 * Does $haystack end with $needle? (byte-wise comparison)
	 *
	 * An empty needle always matches.
	 *
	 * @param  string
	 * @param  string
	 * @return bool
	 */
	public static function endsWith($haystack, $needle)
	{
		return strlen($needle) === 0 || substr($haystack, -strlen($needle)) === $needle;
	}



	/**
	 * Normalizes line endings and whitespace.
	 *
	 * @param  string
	 * @return string
	 */
	public static function normalize($s)
	{
		// unify line endings to "\n"
		$s = str_replace("\r\n", "\n", $s);
		$s = strtr($s, "\r", "\n");

		// drop control characters except tab (\x09) and line feed (\x0A)
		$s = preg_replace('#[\x00-\x08\x0B-\x1F]+#', '', $s);

		// strip trailing tabs and spaces on every line
		$s = preg_replace("#[\t ]+$#m", '', $s);

		// strip leading and trailing blank lines
		$s = trim($s, "\n");

		return $s;
	}



	/**
	 * Converts a UTF-8 string to ASCII by transliteration.
	 *
	 * @param  string  UTF-8 encoded text
	 * @return string
	 */
	public static function toAscii($s)
	{
		// remove code points outside the allowed ranges
		$s = preg_replace('#[^\x09\x0A\x0D\x20-\x7E\xA0-\x{10FFFF}]#u', '', $s);
		// protect the input's own ` ' " ^ ~ behind placeholders \x01-\x05
		$s = strtr($s, '`\'"^~', "\x01\x02\x03\x04\x05");
		if (ICONV_IMPL === 'glibc') {
			$s = @iconv('UTF-8', 'WINDOWS-1250//TRANSLIT', $s);
			// map the remaining WINDOWS-1250 bytes to plain ASCII letters
			$s = strtr($s, "\xa5\xa3\xbc\x8c\xa7\x8a\xaa\x8d\x8f\x8e\xaf\xb9\xb3\xbe\x9c\x9a\xba\x9d\x9f\x9e"
				. "\xbf\xc0\xc1\xc2\xc3\xc4\xc5\xc6\xc7\xc8\xc9\xca\xcb\xcc\xcd\xce\xcf\xd0\xd1\xd2\xd3"
				. "\xd4\xd5\xd6\xd7\xd8\xd9\xda\xdb\xdc\xdd\xde\xdf\xe0\xe1\xe2\xe3\xe4\xe5\xe6\xe7\xe8"
				. "\xe9\xea\xeb\xec\xed\xee\xef\xf0\xf1\xf2\xf3\xf4\xf5\xf6\xf8\xf9\xfa\xfb\xfc\xfd\xfe",
				"ALLSSSSTZZZallssstzzzRAAAALCCCEEEEIIDDNNOOOOxRUUUUYTsraaaalccceeeeiiddnnooooruuuuyt");
		} else {
			$s = @iconv('UTF-8', 'ASCII//TRANSLIT', $s);
		}
		// any ` ' " ^ ~ present now did not come from the input (placeholders
		// still hold those) - presumably transliteration artefacts - so drop them
		$s = str_replace(array('`', "'", '"', '^', '~'), '', $s);
		// restore the protected characters
		return strtr($s, "\x01\x02\x03\x04\x05", '`\'"^~');
	}



	/**
	 * Converts a UTF-8 string to a web-safe form: ASCII letters and digits
	 * (plus $charlist), everything else collapsed into single dashes.
	 *
	 * @param  string  UTF-8 encoded text
	 * @param  string  additional allowed characters
	 * @param  bool    convert to lower case?
	 * @return string
	 */
	public static function webalize($s, $charlist = NULL, $lower = TRUE)
	{
		$s = self::toAscii($s);
		if ($lower) {
			$s = strtolower($s);
		}
		// explicit cast: passing NULL to preg_quote() is deprecated since PHP 8.1
		$s = preg_replace('#[^a-z0-9' . preg_quote((string) $charlist, '#') . ']+#i', '-', $s);
		return trim($s, '-');
	}



	/**
	 * Truncates a UTF-8 string to at most $maxLen characters, including the
	 * appended suffix. Cuts before whitespace or ASCII punctuation when the
	 * pattern finds such a position, otherwise cuts at exactly the limit.
	 *
	 * @param  string  UTF-8 encoded text
	 * @param  int     maximal length in characters
	 * @param  string  suffix appended when the text is shortened (default is an ellipsis)
	 * @return string
	 */
	public static function truncate($s, $maxLen, $append = "\xE2\x80\xA6")
	{
		if (self::length($s) > $maxLen) {
			$maxLen = $maxLen - self::length($append);
			if ($maxLen < 1) {
				// no room for any text, only the suffix is returned
				return $append;

			} elseif ($matches = self::match($s, '#^.{1,'.$maxLen.'}(?=[\s\x00-/:-@\[-`{-~])#us')) {
				return $matches[0] . $append;

			} else {
				return iconv_substr($s, 0, $maxLen, 'UTF-8') . $append;
			}
		}
		return $s;
	}



	/**
	 * Indents every non-empty line of the text.
	 *
	 * @param  string  text
	 * @param  int     number of repetitions of $chars; values below 1 leave the text untouched
	 * @param  string  indentation unit
	 * @return string
	 */
	public static function indent($s, $level = 1, $chars = "\t")
	{
		return $level < 1 ? $s : self::replace($s, '#(?:^|[\r\n]+)(?=[^\r\n])#', '$0' . str_repeat($chars, $level));
	}



	/**
	 * Converts a UTF-8 string to lower case.
	 *
	 * @param  string  UTF-8 encoded text
	 * @return string
	 */
	public static function lower($s)
	{
		return mb_strtolower($s, 'UTF-8');
	}



	/**
	 * Converts a UTF-8 string to upper case.
	 *
	 * @param  string  UTF-8 encoded text
	 * @return string
	 */
	public static function upper($s)
	{
		return mb_strtoupper($s, 'UTF-8');
	}



	/**
	 * Converts the first character of a UTF-8 string to upper case.
	 *
	 * @param  string  UTF-8 encoded text
	 * @return string
	 */
	public static function firstUpper($s)
	{
		return self::upper(mb_substr($s, 0, 1, 'UTF-8')) . mb_substr($s, 1, self::length($s), 'UTF-8');
	}



	/**
	 * Converts a UTF-8 string to title case (MB_CASE_TITLE).
	 *
	 * @param  string  UTF-8 encoded text
	 * @return string
	 */
	public static function capitalize($s)
	{
		return mb_convert_case($s, MB_CASE_TITLE, 'UTF-8');
	}



	/**
	 * Case-insensitive comparison of two UTF-8 strings.
	 *
	 * @param  string
	 * @param  string
	 * @param  int     NULL compares whole strings, a non-negative value only
	 *                 the first $len characters, a negative value only the last -$len
	 * @return bool
	 */
	public static function compare($left, $right, $len = NULL)
	{
		if ($len < 0) {
			$left = iconv_substr($left, $len, -$len, 'UTF-8');
			$right = iconv_substr($right, $len, -$len, 'UTF-8');
		} elseif ($len !== NULL) {
			$left = iconv_substr($left, 0, $len, 'UTF-8');
			$right = iconv_substr($right, 0, $len, 'UTF-8');
		}
		return self::lower($left) === self::lower($right);
	}



	/**
	 * Returns the length of a UTF-8 string in characters.
	 *
	 * Uses mb_strlen() when available, otherwise counts the bytes of
	 * utf8_decode()'s output.
	 *
	 * @param  string
	 * @return int
	 */
	public static function length($s)
	{
		return function_exists('mb_strlen') ? mb_strlen($s, 'UTF-8') : strlen(utf8_decode($s));
	}



	/**
	 * Strips the listed characters from both ends of a UTF-8 string.
	 *
	 * @param  string  UTF-8 encoded text
	 * @param  string  characters to strip (default: ASCII whitespace, NUL and U+00A0)
	 * @return string
	 */
	public static function trim($s, $charlist = " \t\n\r\0\x0B\xC2\xA0")
	{
		$charlist = preg_quote($charlist, '#');
		return self::replace($s, '#^['.$charlist.']+|['.$charlist.']+$#u', '');
	}



	/**
	 * Pads a UTF-8 string on the left to the given length.
	 *
	 * @param  string  UTF-8 encoded text
	 * @param  int     desired length in characters
	 * @param  string  padding; an empty string adds nothing
	 * @return string
	 */
	public static function padLeft($s, $length, $pad = ' ')
	{
		return self::buildPadding(max(0, $length - self::length($s)), $pad) . $s;
	}



	/**
	 * Pads a UTF-8 string on the right to the given length.
	 *
	 * @param  string  UTF-8 encoded text
	 * @param  int     desired length in characters
	 * @param  string  padding; an empty string adds nothing
	 * @return string
	 */
	public static function padRight($s, $length, $pad = ' ')
	{
		return $s . self::buildPadding(max(0, $length - self::length($s)), $pad);
	}



	/**
	 * Builds $length characters of padding by repeating $pad and cutting the
	 * last repetition where needed.
	 *
	 * @param  int|float  number of missing characters
	 * @param  string     padding unit
	 * @return string
	 */
	private static function buildPadding($length, $pad)
	{
		$padLen = self::length($pad);
		if ($length < 1 || $padLen < 1) {
			// nothing to add; also avoids division by zero for an empty $pad
			return '';
		}
		// explicit cast: str_repeat() expects an integer count
		$padding = str_repeat($pad, (int) ($length / $padLen));
		$rest = $length % $padLen;
		if ($rest > 0) {
			$padding .= iconv_substr($pad, 0, $rest, 'UTF-8');
		}
		return $padding;
	}



	/**
	 * Generates a random string. Built on lcg_value() and microtime(), so
	 * the result is NOT suitable for security-sensitive purposes.
	 *
	 * @param  int     number of characters to generate
	 * @param  string  allowed characters; "x-y" is expanded to the range from x to y
	 * @return string
	 */
	public static function random($length = 10, $charlist = '0-9a-z')
	{
		// Expand "x-y" ranges without create_function() (removed in PHP 8.0).
		// With DELIM_CAPTURE the pieces alternate: literal, range, literal, ...
		$pieces = preg_split('#(.-.)#', $charlist, -1, PREG_SPLIT_DELIM_CAPTURE);
		$expanded = '';
		foreach ($pieces as $i => $piece) {
			$expanded .= ($i % 2) ? implode('', range($piece[0], $piece[2])) : $piece;
		}
		$charlist = str_shuffle($expanded);
		$chLen = strlen($charlist);

		$s = '';
		for ($i = 0; $i < $length; $i++) {
			if ($i % 5 === 0) {
				// refresh the random sources every five characters
				$rand = lcg_value();
				$rand2 = microtime(TRUE);
			}
			$rand *= $chLen;
			// explicit cast: "%" would otherwise convert the float implicitly
			$s .= $charlist[((int) ($rand + $rand2)) % $chLen];
			$rand -= (int) $rand;
		}
		return $s;
	}



	/**
	 * Splits a string by a regular expression. PREG_SPLIT_DELIM_CAPTURE is
	 * always added to $flags.
	 *
	 * NDebug is defined outside this file; presumably tryError() starts
	 * capturing PHP errors and catchError() collects them - TODO confirm.
	 *
	 * @param  string
	 * @param  string  regular expression
	 * @param  int     preg_split() flags
	 * @return array
	 * @throws NRegexpException
	 */
	public static function split($subject, $pattern, $flags = 0)
	{
		NDebug::tryError();
		$res = preg_split($pattern, $subject, -1, $flags | PREG_SPLIT_DELIM_CAPTURE);
		self::catchPregError($pattern);
		return $res;
	}



	/**
	 * Performs a regular expression match.
	 *
	 * @param  string
	 * @param  string  regular expression
	 * @param  int     preg_match() flags
	 * @param  int     offset in bytes
	 * @return array|NULL  matches, or NULL when the pattern does not match
	 * @throws NRegexpException
	 */
	public static function match($subject, $pattern, $flags = 0, $offset = 0)
	{
		NDebug::tryError();
		$res = preg_match($pattern, $subject, $m, $flags, $offset);
		self::catchPregError($pattern);
		return $res ? $m : NULL;
	}



	/**
	 * Performs a global regular expression match. Results are in
	 * PREG_SET_ORDER unless PREG_PATTERN_ORDER is requested in $flags.
	 *
	 * @param  string
	 * @param  string  regular expression
	 * @param  int     preg_match_all() flags
	 * @param  int     offset in bytes
	 * @return array
	 * @throws NRegexpException
	 */
	public static function matchAll($subject, $pattern, $flags = 0, $offset = 0)
	{
		NDebug::tryError();
		$res = preg_match_all(
			$pattern, $subject, $m,
			($flags & PREG_PATTERN_ORDER) ? $flags : ($flags | PREG_SET_ORDER),
			$offset
		);
		self::catchPregError($pattern);
		return $m;
	}



	/**
	 * Performs a regular expression search and replace.
	 *
	 * Three call forms are handled:
	 *  - $replacement is an object or array: it is used as a callback for
	 *    preg_replace_callback() (an NCallback is unwrapped via getNative())
	 *  - $pattern is an array: it is read as a pattern => replacement map and
	 *    $replacement is ignored
	 *  - otherwise a plain preg_replace() call
	 *
	 * @param  string
	 * @param  string|array  regular expression, or pattern => replacement map
	 * @param  string|array|object  replacement string or callback
	 * @param  int     maximal number of replacements, -1 for no limit
	 * @return string
	 * @throws InvalidStateException  when the callback is not callable
	 * @throws NRegexpException
	 */
	public static function replace($subject, $pattern, $replacement = NULL, $limit = -1)
	{
		NDebug::tryError();
		if (is_object($replacement) || is_array($replacement)) {
			if ($replacement instanceof NCallback) {
				$replacement = $replacement->getNative();
			}
			if (!is_callable($replacement, FALSE, $textual)) {
				NDebug::catchError($foo);
				throw new InvalidStateException("Callback '$textual' is not callable.");
			}
			$res = preg_replace_callback($pattern, $replacement, $subject, $limit);

			if (NDebug::catchError($e)) {
				// report the error as a regexp error only when the trace frame
				// checked below belongs to this class
				$trace = $e->getTrace();
				if (isset($trace[2]['class']) && $trace[2]['class'] === __CLASS__) {
					throw new NRegexpException($e->getMessage() . " in pattern: "
						. (is_array($pattern) ? implode(' or ', $pattern) : $pattern));
				}
			}

		} elseif (is_array($pattern)) {
			// keep only the list of patterns in $pattern so that error
			// messages below show the patterns, not the whole map
			$replacement = array_values($pattern);
			$pattern = array_keys($pattern);
			$res = preg_replace($pattern, $replacement, $subject, $limit);

		} else {
			$res = preg_replace($pattern, $replacement, $subject, $limit);
		}
		self::catchPregError($pattern);
		return $res;
	}



	/**
	 * Converts an error of the last preg_* call into an NRegexpException.
	 *
	 * Throws when NDebug::catchError() reports an error, or when
	 * preg_last_error() returns a non-zero code.
	 *
	 * @param  string|array  pattern(s) shown in the exception message
	 * @return void
	 * @throws NRegexpException
	 */
	public static function catchPregError($pattern)
	{
		if (is_array($pattern)) {
			// avoid "Array to string conversion" in the messages below
			$pattern = implode(' or ', $pattern);
		}

		if (NDebug::catchError($e)) {
			throw new NRegexpException($e->getMessage() . " in pattern: $pattern");

		} elseif (preg_last_error()) {
			static $messages = array(
				PREG_INTERNAL_ERROR => 'Internal error',
				PREG_BACKTRACK_LIMIT_ERROR => 'Backtrack limit was exhausted',
				PREG_RECURSION_LIMIT_ERROR => 'Recursion limit was exhausted',
				PREG_BAD_UTF8_ERROR => 'Malformed UTF-8 data',
				5 => 'Offset didn\'t correspond to the begin of a valid UTF-8 code point',
			);
			$code = preg_last_error();
			throw new NRegexpException((isset($messages[$code]) ? $messages[$code] : 'Unknown error') . " (pattern: $pattern)", $code);
		}
	}

}
481:
482:
483:
484: 485: 486:
/**
 * Exception thrown by NString when a regular expression call fails.
 */
class NRegexpException extends Exception {}
490: