3 namespace App\TwitchBot;
5 use App\Models\ChatLog;
6 use Illuminate\Support\Arr;
7 use Illuminate\Support\Str;
9 class TokenizedMessage {
11 public function __construct($text, $tags = []) {
12 $this->text = trim($text);
14 $this->raw = strtolower(preg_replace('/[^\w]/u', '', $this->text));
15 $this->tokens = array_values(array_map('trim', array_filter(preg_split('/\b/', strtolower($this->text)))));
17 $this->emoteless = $this->text;
18 if (isset($this->tags['emotes']) && !empty($this->tags['emotes'])) {
19 $emotes = explode('/', $this->tags['emotes']);
20 foreach ($emotes as $emote) {
21 $set = explode(':', $emote);
22 $positions = explode(',', $set[1]);
23 foreach ($positions as $position) {
24 $coords = explode('-', $position);
25 $this->emotes[] = preg_replace('/\d+$/', '', strtolower(substr($this->text, $coords[0], $coords[1] - $coords[0] + 1)));
26 for ($i = intval($coords[0]); $i <= intval($coords[1]); ++$i) {
27 $this->emoteless[$i] = ' ';
31 $this->emoteless = trim(preg_replace('/\s+/', ' ', $this->emoteless));
33 $this->emoteless_raw = strtolower(preg_replace('/[^\w]/', '', $this->emoteless));
34 $this->emoteless_tokens = array_values(array_map('trim', array_filter(preg_split('/\b/', strtolower($this->emoteless)))));
37 public static function fromIRC(IRCMessage $msg) {
38 return new self($msg->getText(), $msg->tags);
41 public static function fromLog(ChatLog $log) {
42 return new self($log->params[1], $log->tags);
45 public static function fromString($text, $tags = []) {
46 return new self($text, $tags);
50 public function contains($text) {
51 return Str::contains($this->text, $text);
54 public function containsEmoteless($text) {
55 return Str::contains($this->emoteless, $text);
58 public function containsRaw($text) {
59 return Str::contains($this->raw, $text);
62 public function endsWith($text) {
63 return Str::endsWith($this->text, $text);
66 public function endsWithEmoteless($text) {
67 return Str::endsWith($this->emoteless, $text);
70 public function endsWithRaw($text) {
71 return Str::endsWith($this->raw, $text);
74 public function getNumericValue() {
75 return intval($this->text);
78 public function hasConsecutiveTokens($tokens) {
79 for ($i = 0; $i < count($this->tokens) - count($tokens) + 1; ++$i) {
80 for ($j = 0; $j < count($tokens); ++$j) {
81 if ($this->tokens[$i + $j] != $tokens[$j]) break;
83 if ($j == count($tokens)) return true;
88 public function hasEmote($text) {
89 if (is_array($text)) {
90 foreach ($text as $token) {
91 if (in_array($token, $this->emotes)) {
97 return in_array($text, $this->emotes);
100 public function hasEmoteThatContains($text) {
101 foreach ($this->emotes as $emote) {
102 if (Str::contains($emote, $text)) {
109 public function hasEmoteThatEndsWith($text) {
110 foreach ($this->emotes as $emote) {
111 if (Str::endsWith($emote, $text)) {
118 public function hasEmoteThatStartsOrEndsWith($text) {
119 foreach ($this->emotes as $emote) {
120 if (Str::startsWith($emote, $text) || Str::endsWith($emote, $text)) {
127 public function hasEmoteThatStartsWith($text) {
128 foreach ($this->emotes as $emote) {
129 if (Str::startsWith($emote, $text)) {
136 public function hasToken($text) {
137 if (is_array($text)) {
138 foreach ($text as $token) {
139 if (in_array($token, $this->tokens)) {
145 return in_array($text, $this->tokens);
148 public function hasTokenThatContains($text) {
149 foreach ($this->tokens as $token) {
150 if (Str::contains($token, $text)) {
157 public function hasTokenThatEndsWith($text) {
158 foreach ($this->tokens as $token) {
159 if (Str::endsWith($token, $text)) {
166 public function hasTokenThatStartsOrEndsWith($text) {
167 foreach ($this->tokens as $token) {
168 if (Str::startsWith($token, $text) || Str::endsWith($token, $text)) {
175 public function hasTokenThatStartsWith($text) {
176 foreach ($this->tokens as $token) {
177 if (Str::startsWith($token, $text)) {
184 public function startsOrEndsWith($text) {
185 return $this->startsWith($text) || $this->endsWith($text);
188 public function startsOrEndsWithRaw($text) {
189 return $this->startsWithRaw($text) || $this->endsWithRaw($text);
192 public function startsWith($text) {
193 return Str::startsWith($this->text, $text);
196 public function startsWithEmoteless($text) {
197 return Str::startsWith($this->emoteless, $text);
200 public function startsWithRaw($text) {
201 return Str::startsWith($this->raw, $text);
205 public function isSpammy() {
206 if ($this->startsWith('!')) {
209 if ($this->contains(['€', '$', '@', '://'])) {
212 if ($this->containsRaw(['followers', 'promotion', 'viewers'])) {
215 if ($this->containsRaw('horstie')) {
218 if ($this->containsRaw(['folgtjetzt', 'vielendankfürdenraid', 'thanksfortheraid', 'willkommenaufstarbase47'])) {
225 public function classify() {
226 if (is_null($this->classification)) {
227 if (empty($this->text)) {
228 $this->classification = 'unclassified';
229 } else if ($this->startsWith('!')) {
230 $this->classification = 'cmd';
231 } else if ($this->hasTokenThatStartsOrEndsWith(['gg']) || $this->hasEmoteThatEndsWith(['gg'])) {
232 $this->classification = 'gg';
233 } else if ($this->containsRaw(['glgl', 'glhf', 'goodluck', 'hfgl'])) {
234 $this->classification = 'gl';
235 } else if ($this->hasToken(['danke', 'thanks', 'thx', 'ty']) && !$this->hasToken(['nah', 'nee', 'nein', 'no'])) {
236 $this->classification = 'thx';
237 } else if ($this->startsWithRaw(['ahoi', 'hallo', 'hello', 'hey', 'huhu', 'moin']) || $this->hasEmoteThatEndsWith(['hello', 'heyguys', 'hi', 'vohiyo', 'wave']) || $this->hasToken(['hi', 'hey', 'yo']) || $this->containsRaw(['gutenmorgen', 'gutenabend'])) {
238 $this->classification = 'hi';
239 } else if ($this->hasTokenThatStartsOrEndsWith(['pog', 'wow'])) {
240 $this->classification = 'pog';
241 } else if ($this->containsRaw(['hype']) || $this->hasEmoteThatEndsWith(['dance', 'jam', 'party', 'rave', 'troete'])) {
242 $this->classification = 'hype';
243 } else if ($this->hasToken(['<3']) || $this->hasEmoteThatEndsWith(['heart', 'herz', 'hug', 'love'])) {
244 $this->classification = 'love';
245 } else if ($this->hasToken(['nani', 'wat', 'wtf']) || $this->hasEmoteThatEndsWith(['wat', 'wtf'])) {
246 $this->classification = 'wtf';
247 } else if ($this->hasConsecutiveTokens([':', 'eyes', ':']) || $this->hasEmoteThatEndsWith(['eyes'])) {
248 $this->classification = 'eyes';
249 } else if ($this->hasEmoteThatEndsWith(['angry', 'rage', 'ree'])) {
250 $this->classification = 'rage';
251 } else if ($this->hasToken([':(']) || $this->hasEmoteThatEndsWith(['cry', 'sad'])) {
252 $this->classification = 'sad';
253 } else if ($this->hasToken(['monkas', 'sweat_smile']) || $this->hasEmoteThatEndsWith(['sweat'])) {
254 $this->classification = 'sweat';
255 } else if ($this->endsWithEmoteless('?')) {
256 $this->classification = 'question';
257 } else if ($this->hasToken(['ja', 'jo', 'yep', 'yes']) || $this->containsRaw('nodders') || $this->hasEmoteThatEndsWith(['nod', 'nodders', 'yea'])) {
258 $this->classification = 'yes';
259 } else if ($this->hasToken(['nah', 'nee', 'nein', 'no']) || $this->containsRaw('nopers') || $this->hasEmoteThatEndsWith(['nay', 'nope', 'nopers'])) {
260 $this->classification = 'no';
261 } else if ($this->hasEmoteThatContains(['kappa', 'keepo'])) {
262 $this->classification = 'kappa';
263 } else if ($this->startsOrEndsWithRaw(['o7']) || $this->hasEmoteThatContains('salut')) {
264 $this->classification = 'o7';
265 } else if ($this->containsRaw(['haha', 'hehe', 'hihi', 'kekw', 'lol', 'lul']) || $this->hasTokenThatStartsWith(['xd']) || $this->hasConsecutiveTokens([':', 'd'])) {
266 $this->classification = 'lol';
267 } else if (is_numeric($this->raw)) {
268 $this->classification = 'number';
270 $this->classification = 'unclassified';
273 return $this->classification;
282 private $emotes = [];
283 private $emoteless = '';
284 private $emoteless_raw = '';
285 private $emoteless_tokens = [];
287 private $classification = null;