From 17d885fed87ede236488e80552b9ee9557001e19 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?marcin=20miko=C5=82ajczak?= Date: Sat, 5 Nov 2022 20:16:32 +0100 Subject: [PATCH] Fix fasttext for multiline posts MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: marcin mikołajczak --- lib/pleroma/language/language_detector/fasttext.ex | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/lib/pleroma/language/language_detector/fasttext.ex b/lib/pleroma/language/language_detector/fasttext.ex index d479d2125..0f621a000 100644 --- a/lib/pleroma/language/language_detector/fasttext.ex +++ b/lib/pleroma/language/language_detector/fasttext.ex @@ -25,7 +25,7 @@ defmodule Pleroma.Language.LanguageDetector.Fasttext do def detect(text) do text_path = Path.join(System.tmp_dir!(), "fasttext-#{Ecto.UUID.generate()}") - File.write(text_path, text) + File.write(text_path, text |> String.replace(~r/\s+/, " ")) detected_language = case System.cmd("fasttext", ["predict", get_model(), text_path]) do