|
| 1 | +<?php |
| 2 | +namespace anlutro\Menu\Util; |
| 3 | + |
/**
 * Static string helpers used to derive ASCII slugs from arbitrary text.
 */
class StringUtils
{
    /**
     * Build a lowercase ASCII slug from a string.
     *
     * Steps, in order:
     *  1. Characters listed in charsArray() are replaced by their ASCII key.
     *  2. Every byte outside printable ASCII (0x20-0x7E) is removed.
     *  3. Runs of dashes and underscores become the separator.
     *  4. The string is lowercased and anything that is not a letter, a
     *     number, whitespace or the separator is removed.
     *  5. Runs of separator/whitespace collapse to one separator, and
     *     separator characters are trimmed from both ends.
     *
     * The separator is used inside a regex character class and as a trim()
     * character list, so a multi-character separator is treated as a set
     * of characters in those two places.
     *
     * @param  string  $string     Text to convert.
     * @param  string  $separator  Word separator placed in the slug.
     * @return string
     */
    public static function slug($string, $separator = '-')
    {
        // Transliterate known non-ASCII characters to their ASCII key.
        foreach (static::charsArray() as $ascii => $variants) {
            $string = str_replace($variants, $ascii, $string);
        }

        // Strip everything outside printable ASCII. This runs byte-wise on
        // purpose (no "u" modifier): in UTF-8 mode preg_replace() returns
        // null for malformed input, which would wipe out the whole slug.
        // For well-formed UTF-8 the result is the same either way, because
        // every byte of a multi-byte character is >= 0x80.
        $string = preg_replace('/[^\x20-\x7E]/', '', $string);

        $quotedSeparator = preg_quote($separator);

        // Convert all dashes and underscores into the separator, whatever
        // the separator is, so neither is dropped by the clean-up below.
        $string = preg_replace('![-_]+!u', $separator, $string);

        // Remove all characters that are not the separator, letters,
        // numbers, or whitespace.
        $string = preg_replace(
            '![^'.$quotedSeparator.'\pL\pN\s]+!u',
            '',
            mb_strtolower($string)
        );

        // Replace all separator characters and whitespace by a single
        // separator.
        $string = preg_replace('!['.$quotedSeparator.'\s]+!u', $separator, $string);

        return trim($string, $separator);
    }

    /**
     * Transliteration table used by slug().
     *
     * Each key is the ASCII replacement; each value is the list of
     * characters replaced by that key. The array is built on the first
     * call and kept in a static local for later calls.
     *
     * @return array
     */
    protected static function charsArray()
    {
        static $charsArray;

        if (isset($charsArray)) {
            return $charsArray;
        }

        return $charsArray = array(
            'a' => array(
                'à', 'á', 'ả', 'ã', 'ạ', 'ă', 'ắ', 'ằ', 'ẳ', 'ẵ',
                'ặ', 'â', 'ấ', 'ầ', 'ẩ', 'ẫ', 'ậ', 'ä', 'ā', 'ą',
                'å', 'α', 'ά', 'ἀ', 'ἁ', 'ἂ', 'ἃ', 'ἄ', 'ἅ', 'ἆ',
                'ἇ', 'ᾀ', 'ᾁ', 'ᾂ', 'ᾃ', 'ᾄ', 'ᾅ', 'ᾆ', 'ᾇ', 'ὰ',
                'ά', 'ᾰ', 'ᾱ', 'ᾲ', 'ᾳ', 'ᾴ', 'ᾶ', 'ᾷ', 'а'),
            'b' => array('б', 'β'),
            'c' => array('ç', 'ć', 'č', 'ĉ', 'ċ'),
            'd' => array('ď', 'ð', 'đ', 'ƌ', 'ȡ', 'ɖ', 'ɗ', 'ᵭ', 'ᶁ', 'ᶑ',
                'д'),
            'e' => array('é', 'è', 'ẻ', 'ẽ', 'ẹ', 'ê', 'ế', 'ề', 'ể', 'ễ',
                'ệ', 'ë', 'ē', 'ę', 'ě', 'ĕ', 'ė', 'ε', 'έ', 'ἐ',
                'ἑ', 'ἒ', 'ἓ', 'ἔ', 'ἕ', 'ὲ', 'έ', 'е', 'ё', 'э',
                'є'),
            'f' => array('ф'),
            'g' => array('ĝ', 'ğ', 'ġ', 'ģ', 'г', 'ґ'),
            'h' => array('ĥ', 'ħ'),
            'i' => array('í', 'ì', 'ỉ', 'ĩ', 'ị', 'î', 'ï', 'ī', 'ĭ', 'į',
                'ı', 'ι', 'ί', 'ϊ', 'ΐ', 'ἰ', 'ἱ', 'ἲ', 'ἳ', 'ἴ',
                'ἵ', 'ἶ', 'ἷ', 'ὶ', 'ί', 'ῐ', 'ῑ', 'ῒ', 'ΐ', 'ῖ',
                'ῗ', 'і', 'ї', 'и'),
            'j' => array('ĵ'),
            'k' => array('ķ', 'ĸ', 'к'),
            'l' => array('ł', 'ľ', 'ĺ', 'ļ', 'ŀ', 'л'),
            'm' => array('м'),
            'n' => array('ñ', 'ń', 'ň', 'ņ', 'ʼn', 'ŋ', 'ν', 'н'),
            'o' => array('ó', 'ò', 'ỏ', 'õ', 'ọ', 'ô', 'ố', 'ồ', 'ổ', 'ỗ',
                'ộ', 'ơ', 'ớ', 'ờ', 'ở', 'ỡ', 'ợ', 'ø', 'ō', 'ő',
                'ŏ', 'ο', 'ὀ', 'ὁ', 'ὂ', 'ὃ', 'ὄ', 'ὅ', 'ὸ', 'ό',
                'ö', 'о'),
            'p' => array('п'),
            'r' => array('ŕ', 'ř', 'ŗ', 'р'),
            's' => array('ś', 'š', 'ş', 'с'),
            't' => array('ť', 'ţ', 'т'),
            'u' => array('ú', 'ù', 'ủ', 'ũ', 'ụ', 'ư', 'ứ', 'ừ', 'ử', 'ữ',
                'ự', 'ü', 'û', 'ū', 'ů', 'ű', 'ŭ', 'ų', 'µ', 'у'),
            'v' => array('в'),
            'w' => array('ŵ'),
            'y' => array('ý', 'ỳ', 'ỷ', 'ỹ', 'ỵ', 'ÿ', 'ŷ', 'й', 'ы'),
            'z' => array('ź', 'ž', 'ż', 'з'),
            'ch' => array('ч'),
            'kh' => array('х'),
            'oe' => array('œ'),
            'sh' => array('ш'),
            'shch' => array('щ'),
            'ts' => array('ц'),
            'ya' => array('я'),
            'yu' => array('ю'),
            'zh' => array('ж'),
            'A' => array('Á', 'À', 'Ả', 'Ã', 'Ạ', 'Ă', 'Ắ', 'Ằ', 'Ẳ', 'Ẵ',
                'Ặ', 'Â', 'Ấ', 'Ầ', 'Ẩ', 'Ẫ', 'Ậ', 'Ä', 'Å', 'Ā',
                'Ą', 'Α', 'Ά', 'Ἀ', 'Ἁ', 'Ἂ', 'Ἃ', 'Ἄ', 'Ἅ', 'Ἆ',
                'Ἇ', 'ᾈ', 'ᾉ', 'ᾊ', 'ᾋ', 'ᾌ', 'ᾍ', 'ᾎ', 'ᾏ', 'Ᾰ',
                'Ᾱ', 'Ὰ', 'Ά', 'ᾼ', 'А'),
            'B' => array('Б'),
            'C' => array('Ć', 'Č', 'Ĉ', 'Ċ'),
            'D' => array('Ď', 'Ð', 'Đ', 'Ɖ', 'Ɗ', 'Ƌ', 'ᴅ', 'ᴆ', 'Д'),
            'E' => array('É', 'È', 'Ẻ', 'Ẽ', 'Ẹ', 'Ê', 'Ế', 'Ề', 'Ể', 'Ễ',
                'Ệ', 'Ë', 'Ē', 'Ę', 'Ě', 'Ĕ', 'Ė', 'Ε', 'Έ', 'Ἐ',
                'Ἑ', 'Ἒ', 'Ἓ', 'Ἔ', 'Ἕ', 'Έ', 'Ὲ', 'Е', 'Ё', 'Э',
                'Є'),
            'F' => array('Ф'),
            'G' => array('Ğ', 'Ġ', 'Ģ', 'Г', 'Ґ'),
            'I' => array('Í', 'Ì', 'Ỉ', 'Ĩ', 'Ị', 'Î', 'Ï', 'Ī', 'Ĭ', 'Į',
                'İ', 'Ι', 'Ί', 'Ϊ', 'Ἰ', 'Ἱ', 'Ἳ', 'Ἴ', 'Ἵ', 'Ἶ',
                'Ἷ', 'Ῐ', 'Ῑ', 'Ὶ', 'Ί', 'И', 'І', 'Ї'),
            'K' => array('К'),
            'L' => array('Ĺ', 'Ł', 'Л'),
            'M' => array('М'),
            'N' => array('Ń', 'Ñ', 'Ň', 'Ņ', 'Ŋ', 'Н'),
            'O' => array('Ó', 'Ò', 'Ỏ', 'Õ', 'Ọ', 'Ô', 'Ố', 'Ồ', 'Ổ', 'Ỗ',
                'Ộ', 'Ơ', 'Ớ', 'Ờ', 'Ở', 'Ỡ', 'Ợ', 'Ö', 'Ø', 'Ō',
                'Ő', 'Ŏ', 'Ο', 'Ό', 'Ὀ', 'Ὁ', 'Ὂ', 'Ὃ', 'Ὄ', 'Ὅ',
                'Ὸ', 'Ό', 'О'),
            'P' => array('П'),
            'R' => array('Ř', 'Ŕ', 'Р'),
            'S' => array('Ş', 'Ŝ', 'Ș', 'Š', 'Ś', 'С'),
            'T' => array('Ť', 'Ţ', 'Ŧ', 'Ț', 'Т'),
            'U' => array('Ú', 'Ù', 'Ủ', 'Ũ', 'Ụ', 'Ư', 'Ứ', 'Ừ', 'Ử', 'Ữ',
                'Ự', 'Û', 'Ü', 'Ū', 'Ů', 'Ű', 'Ŭ', 'Ų', 'У'),
            'V' => array('В'),
            'Y' => array('Ý', 'Ỳ', 'Ỷ', 'Ỹ', 'Ỵ', 'Ÿ', 'Ῠ', 'Ῡ', 'Ὺ', 'Ύ',
                'Ы', 'Й'),
            'Z' => array('Ź', 'Ž', 'Ż', 'З'),
            'CH' => array('Ч'),
            'KH' => array('Х'),
            'SH' => array('Ш'),
            'SHCH' => array('Щ'),
            'TS' => array('Ц'),
            'YA' => array('Я'),
            'YU' => array('Ю'),
            'ZH' => array('Ж'),
            // UTF-8 byte sequences for non-ASCII space characters
            // (U+00A0, U+2000-U+200A, U+202F, U+205F, U+3000), each
            // replaced by a plain ASCII space.
            ' ' => array("\xC2\xA0", "\xE2\x80\x80", "\xE2\x80\x81",
                "\xE2\x80\x82", "\xE2\x80\x83", "\xE2\x80\x84",
                "\xE2\x80\x85", "\xE2\x80\x86", "\xE2\x80\x87",
                "\xE2\x80\x88", "\xE2\x80\x89", "\xE2\x80\x8A",
                "\xE2\x80\xAF", "\xE2\x81\x9F", "\xE3\x80\x80"),
        );
    }
}
0 commit comments