]> git.localhorst.tv Git - alttp.git/blobdiff - app/TwitchBot/TokenizedMessage.php
multibyte handling in emote tokenizer
[alttp.git] / app / TwitchBot / TokenizedMessage.php
index b32ba720a3cb0489d61143969b82f4e0e154f83a..37836a915235c7356d7bcac8b1d4939a90b63ce4 100644 (file)
@@ -22,15 +22,13 @@ class TokenizedMessage {
                                $positions = explode(',', $set[1]);
                                foreach ($positions as $position) {
                                        $coords = explode('-', $position);
-                                       $this->emotes[] = preg_replace('/\d+$/', '', strtolower(substr($this->text, $coords[0], $coords[1] - $coords[0] + 1)));
-                                       for ($i = intval($coords[0]); $i <= intval($coords[1]); ++$i) {
-                                               $this->emoteless[$i] = ' ';
-                                       }
+                                       $this->emotes[] = preg_replace('/\d+$/', '', strtolower(mb_substr($this->text, $coords[0], $coords[1] - $coords[0] + 1)));
+                                       $this->emoteless = mb_substr($this->emoteless, 0, $coords[0]).str_repeat(' ', $coords[1] - $coords[0] + 1).mb_substr($this->emoteless, $coords[1] + 1);
                                }
                        }
-                       $this->emoteless = trim(preg_replace('/\s+/', ' ', $this->emoteless));
+                       $this->emoteless = trim(preg_replace('/\s+/u', ' ', $this->emoteless));
                }
-               $this->emoteless_raw = strtolower(preg_replace('/[^\w]/', '', $this->emoteless));
+               $this->emoteless_raw = strtolower(preg_replace('/[^\w]/u', '', $this->emoteless));
                $this->emoteless_tokens = array_values(array_map('trim', array_filter(preg_split('/\b/u', strtolower($this->emoteless)))));
        }