mirror of
https://github.com/friendica/friendica
synced 2025-04-30 19:44:24 +02:00
Improve plaintext generation for language detection
This commit is contained in:
parent
cc42c0ba27
commit
16224a7001
2 changed files with 24 additions and 1 deletion
|
@@ -2476,7 +2476,17 @@ class Item
|
|||
return '';
|
||||
}
|
||||
|
||||
$naked_body = BBCode::toPlaintext($item['body'], false);
|
||||
// Convert attachments to links
|
||||
$naked_body = BBCode::removeAttachment($item['body']);
|
||||
|
||||
// Remove links and pictures
|
||||
$naked_body = BBCode::removeLinks($naked_body);
|
||||
|
||||
// Convert the title and the body to plain text
|
||||
$naked_body = trim($item['title'] . "\n" . BBCode::toPlaintext($naked_body));
|
||||
|
||||
// Remove possibly remaining links
|
||||
$naked_body = preg_replace(Strings::autoLinkRegEx(), '', $naked_body);
|
||||
|
||||
$ld = new Language();
|
||||
$languages = $ld->detect($naked_body)->limit(0, 3)->close();
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue