]> git.localhorst.tv Git - alttp.git/blobdiff - app/Models/ChatLog.php
switch to (slightly) better language detection model
[alttp.git] / app / Models / ChatLog.php
index 79eab97debff1a56a6ee081efbdf59951f22a5d9..e17076aee164871121663d9976cdbc796699238f 100644 (file)
@@ -6,7 +6,7 @@ use Illuminate\Database\Eloquent\Factories\HasFactory;
 use Illuminate\Database\Eloquent\Model;
 use Illuminate\Support\Arr;
 use Illuminate\Support\Str;
-use LanguageDetector\LanguageDetector;
+use LanguageDetection\Language;
 
 class ChatLog extends Model {
 
@@ -86,7 +86,7 @@ class ChatLog extends Model {
                if (Str::contains($rawText, ['haha', 'hehe', 'hihi', 'kekw', 'lol', 'lul', 'xd'])) {
                        return 'lol';
                }
-               if (Str::startsWith($rawText, ['ahoi', 'hallo', 'hello', 'hi', 'huhu']) || Str::endsWith($rawText, ['hi', 'wave'])) {
+               if (Str::startsWith($rawText, ['ahoi', 'hallo', 'hello', 'hi ', 'huhu']) || Str::endsWith($rawText, ['hi', 'wave'])) {
                        return 'hi';
                }
                if (Str::contains($rawText, ['pog', 'wow'])) {
@@ -125,11 +125,11 @@ class ChatLog extends Model {
                                $languages[] = 'en';
                        }
                }
-               $detector = LanguageDetector::detect($this->text_content, $languages);
-               $scores = $detector->getScores();
-               $lang = strval($detector->getLanguage());
+               $detector = (new Language($languages))->detect($this->text_content);
+               $scores = $detector->close();
+               $lang = strval($detector);
                //var_dump($scores, $lang, $this->text_content);
-               if (is_array($scores) && isset($scores[$lang]) && $scores[$lang] > 0.35) {
+               if (!empty($lang) && $scores[$lang] > 0.4) {
                        $this->detected_language = $lang;
                }
        }