git.localhorst.tv Git - alttp.git/blobdiff - app/Models/ChatLog.php
fix check for spam
[alttp.git] / app / Models / ChatLog.php
index 8c890e707112acc3ade9ea8450b821def2c92915..943ce6e659e846effb274ba467c23ecfbd1470ff 100644 (file)
@@ -4,6 +4,8 @@ namespace App\Models;
 
 use Illuminate\Database\Eloquent\Factories\HasFactory;
 use Illuminate\Database\Eloquent\Model;
+use Illuminate\Support\Arr;
+use Illuminate\Support\Str;
 use LanguageDetector\LanguageDetector;
 
 class ChatLog extends Model {
@@ -32,7 +34,7 @@ class ChatLog extends Model {
                }
 
                if ($this->command == 'PRIVMSG') {
-                       if ($this->isKnownBot()) {
+                       if (static::isKnownBot($this->nick)) {
                                $this->type = 'bot';
                        } else if (substr($this->params[0], 0, 1) == '#') {
                                $this->type = 'chat';
@@ -44,26 +46,61 @@ class ChatLog extends Model {
                        if ($this->scanForSpam()) {
                                $this->banned = true;
                        }
+                       $this->classification = static::classify($this->text_content);
                        return;
                }
 
                throw new \Exception('unidentified message');
        }
 
-       public function isKnownBot() {
-               return in_array(strtolower($this->nick), [
+       public static function isKnownBot($nick) {
+               return in_array(strtolower($nick), [
                        'birrellthesquirrel',
                        'funtoon',
                        'nidbot2000',
                        'nightbot',
                        'pokemoncommunitygame',
                        'speedgaming',
+                       'starbase47',
                        'streamelements',
                        'wizebot',
                        'zockerstuebchen',
                ]);
        }
 
+       /** Classify a chat message into a coarse reaction label; 'unclassified' when nothing matches. */
+       public static function classify($text) {
+               // empty() alone is true for '0', which kept the message "0" from reaching the number check.
+               if (empty($text) && !is_numeric($text)) {
+                       return 'unclassified';
+               }
+               if (is_numeric(trim($text))) {
+                       return 'number';
+               }
+               // Keep word characters only so spaces and punctuation cannot split a keyword.
+               $rawText = strtolower(preg_replace('/[^\w]/', '', $text));
+               // First match wins, so the order of the checks below is significant.
+               if (Str::startsWith($rawText, 'gg') || Str::endsWith($rawText, 'gg')) {
+                       return 'gg';
+               }
+               if (Str::contains($rawText, ['glgl', 'glhf', 'hfgl'])) {
+                       return 'gl';
+               }
+               if (Str::contains($rawText, ['haha', 'hehe', 'hihi', 'kekw', 'lol', 'lul', 'xd'])) {
+                       return 'lol';
+               }
+               if (Str::startsWith($rawText, ['ahoi', 'hallo', 'hello', 'hi', 'huhu']) || Str::endsWith($rawText, ['hi', 'wave'])) {
+                       return 'hi';
+               }
+               if (Str::contains($rawText, ['pog', 'wow'])) {
+                       return 'pog';
+               }
+               if (Str::contains($rawText, ['hype'])) {
+                       return 'hype';
+               }
+               return (Str::startsWith($rawText, 'o7') || Str::endsWith($rawText, 'o7') || Str::contains($rawText, 'salut')) ? 'o7' : 'unclassified';
+       }
+
        protected function evaluateUser() {
        }
 
@@ -97,38 +134,42 @@ class ChatLog extends Model {
                }
        }
 
-       protected function scanForSpam() {
-               if (substr($this->text_content, 0, 1) == '!') {
+       public static function spammyText($text) {
+               if (substr($text, 0, 1) == '!') {
                        return true;
                }
-               if (strpos($this->text_content, '$') !== false) {
+               if (strpos($text, '$') !== false) {
                        return true;
                }
-               if (strpos($this->text_content, '€') !== false) {
+               if (strpos($text, '€') !== false) {
                        return true;
                }
-               if (strpos($this->text_content, '@') !== false) {
+               if (strpos($text, '@') !== false) {
                        return true;
                }
-               if (strpos($this->text_content, '://') !== false) {
+               if (strpos($text, '://') !== false) {
                        return true;
                }
-               if (is_numeric($this->text_content)) {
+               if (strpos($text, 'followers') !== false) {
                        return true;
                }
-               if (strpos($this->text_content, 'followers') !== false) {
+               if (strpos($text, 'promotion') !== false) {
                        return true;
                }
-               if (strpos($this->text_content, 'promotion') !== false) {
+               if (strpos($text, 'viewers') !== false) {
                        return true;
                }
-               if (strpos($this->text_content, 'viewers') !== false) {
+               if (strpos($text, 'view ers') !== false) {
                        return true;
                }
-               if (strpos($this->text_content, 'view ers') !== false) {
+               return false;
+       }
+
+       protected function scanForSpam() {
+               if (is_numeric($this->text_content)) {
                        return true;
                }
-               return false;
+               return static::spammyText($this->text_content);
        }
 
        protected $casts = [