X-Git-Url: https://git.localhorst.tv/?a=blobdiff_plain;f=app%2FModels%2FChatLog.php;h=3b4df15f2ac9596846729b91fc564c5780ca68b8;hb=29ee4d076868ce530e94a4dcea5d5cf8be772571;hp=05c1584e44a306dc47d4abc130fcde3f598370bc;hpb=05862d3235a4472abe49ae994bd927943744e451;p=alttp.git diff --git a/app/Models/ChatLog.php b/app/Models/ChatLog.php index 05c1584..3b4df15 100644 --- a/app/Models/ChatLog.php +++ b/app/Models/ChatLog.php @@ -6,7 +6,7 @@ use Illuminate\Database\Eloquent\Factories\HasFactory; use Illuminate\Database\Eloquent\Model; use Illuminate\Support\Arr; use Illuminate\Support\Str; -use LanguageDetector\LanguageDetector; +use LanguageDetection\Language; class ChatLog extends Model { @@ -20,6 +20,24 @@ class ChatLog extends Model { return $this->belongsTo(User::class); } + public function getTextWithoutEmotes() { + $text = $this->text_content; + if (isset($this->tags['emotes']) && !empty($this->tags['emotes'])) { + $emotes = explode('/', $this->tags['emotes']); + foreach ($emotes as $emote) { + $set = explode(':', $emote); + $positions = explode(',', $set[1]); + foreach ($positions as $position) { + $coords = explode('-', $position); + for ($i = intval($coords[0]); $i <= intval($coords[1]); ++$i) { + $text[$i] = ' '; + } + } + } + } + return trim(preg_replace('/\s+/', ' ', $text)); + } + public function evaluate() { $this->evaluateUser(); $this->evaluateChannel(); @@ -86,7 +104,7 @@ class ChatLog extends Model { if (Str::contains($rawText, ['haha', 'hehe', 'hihi', 'kekw', 'lol', 'lul', 'xd'])) { return 'lol'; } - if (Str::startsWith($rawText, ['ahoi', 'hallo', 'hello', 'hi', 'huhu']) || Str::endsWith($rawText, ['hi', 'wave'])) { + if (Str::startsWith($rawText, ['ahoi', 'hallo', 'hello', 'hi ', 'huhu']) || Str::endsWith($rawText, ['hi', 'wave'])) { return 'hi'; } if (Str::contains($rawText, ['pog', 'wow'])) { @@ -125,16 +143,17 @@ class ChatLog extends Model { $languages[] = 'en'; } } - $detector = LanguageDetector::detect($this->text_content, $languages); - $scores = $detector->getScores(); - $lang = strval($detector->getLanguage()); + $detector = (new Language($languages))->detect($this->getTextWithoutEmotes()); + $scores = $detector->close(); + $lang = strval($detector); //var_dump($scores, $lang, $this->text_content); - if (is_array($scores) && isset($scores[$lang]) && $scores[$lang] > 0.35) { + if (!empty($lang) && $scores[$lang] > 0.4) { $this->detected_language = $lang; } } - public static function spammyText($text) { + public static function spammyText($raw_text) { + $text = strtolower($raw_text); if (substr($text, 0, 1) == '!') { return true; } @@ -153,6 +172,9 @@ class ChatLog extends Model { if (strpos($text, 'followers') !== false) { return true; } + if (strpos($text, 'horstie') !== false) { + return true; + } if (strpos($text, 'promotion') !== false) { return true; } @@ -162,10 +184,10 @@ class ChatLog extends Model { if (strpos($text, 'view ers') !== false) { return true; } - if (strpos($text, 'vielen Dank für den Raid') !== false) { + if (strpos($text, 'vielen dank für den raid') !== false) { return true; } - if (strpos($text, 'Willkommen auf Starbase 47') !== false) { + if (strpos($text, 'willkommen auf starbase 47') !== false) { return true; } return false;