2020-10-29 01:20:26 -04:00
|
|
|
<?php
|
|
|
|
/**
|
2021-03-29 02:40:20 -04:00
|
|
|
* @copyright Copyright (C) 2010-2021, the Friendica project
|
2020-10-29 01:20:26 -04:00
|
|
|
*
|
|
|
|
* @license GNU AGPL version 3 or any later version
|
|
|
|
*
|
|
|
|
* This program is free software: you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU Affero General Public License as
|
|
|
|
* published by the Free Software Foundation, either version 3 of the
|
|
|
|
* License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU Affero General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Affero General Public License
|
|
|
|
* along with this program. If not, see <https://www.gnu.org/licenses/>.
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
|
|
|
namespace Friendica\Model\Post;
|
|
|
|
|
2021-04-26 02:50:12 -04:00
|
|
|
use Friendica\Content\Text\BBCode;
|
2020-10-29 01:20:26 -04:00
|
|
|
use Friendica\Core\Logger;
|
|
|
|
use Friendica\Core\System;
|
2020-11-19 14:34:48 -05:00
|
|
|
use Friendica\Database\Database;
|
2020-10-29 01:20:26 -04:00
|
|
|
use Friendica\Database\DBA;
|
2020-10-31 09:26:08 -04:00
|
|
|
use Friendica\DI;
|
2021-04-29 17:05:22 -04:00
|
|
|
use Friendica\Model\Item;
|
|
|
|
use Friendica\Model\Post;
|
2020-10-29 01:20:26 -04:00
|
|
|
use Friendica\Util\Images;
|
2021-04-26 02:50:12 -04:00
|
|
|
use Friendica\Util\ParseUrl;
|
2021-04-29 14:23:04 -04:00
|
|
|
use Friendica\Util\Strings;
|
2020-10-29 01:20:26 -04:00
|
|
|
|
|
|
|
/**
|
|
|
|
* Class Media
|
|
|
|
*
|
|
|
|
* This Model class handles media interactions.
|
|
|
|
* This table stores media (images, videos, audio files) related to posts.
|
|
|
|
*/
|
|
|
|
class Media
|
|
|
|
{
|
2021-04-14 15:12:01 -04:00
|
|
|
// Media type identifiers. The methods of this class compare them against the "type" field of a media record.
const UNKNOWN = 0;
|
|
|
|
const IMAGE = 1;
|
|
|
|
const VIDEO = 2;
|
|
|
|
const AUDIO = 3;
|
|
|
|
const TEXT = 4;
|
|
|
|
const APPLICATION = 5;
|
|
|
|
const TORRENT = 16;
|
|
|
|
const HTML = 17;
|
|
|
|
const XML = 18;
|
|
|
|
const PLAIN = 19;
|
|
|
|
const DOCUMENT = 128;
|
2020-10-29 01:20:26 -04:00
|
|
|
|
|
|
|
/**
 * Store a post-media record
 *
 * The record is written immediately. Afterwards additional data is fetched
 * and the record is written a second time when that data differs from what
 * has been stored at first.
 *
 * @param array $media Media record, the fields "url", "uri-id" and "type" are mandatory
 * @param bool  $force Skip the check for an already stored record with the same url
 * @return void
 */
public static function insert(array $media, bool $force = false)
{
	$incomplete = empty($media['url']) || empty($media['uri-id']) || !isset($media['type']);
	if ($incomplete) {
		Logger::warning('Incomplete media data', ['media' => $media]);
		return;
	}

	$uriId = $media['uri-id'];
	$url   = $media['url'];

	// A url that is already known as the preview of another record is never stored on its own
	if (DBA::exists('post-media', ['uri-id' => $uriId, 'preview' => $url])) {
		Logger::info('Media already exists as preview', ['uri-id' => $uriId, 'url' => $url, 'callstack' => System::callstack()]);
		return;
	}

	// "document" has got the lowest priority. So when the same file is both attached as document
	// and embedded as picture then we only store the picture or replace the document
	$existing = DBA::selectFirst('post-media', ['type'], ['uri-id' => $uriId, 'url' => $url]);
	if (!$force && !empty($existing)) {
		$replacesDocument = ($existing['type'] == self::DOCUMENT) && ($media['type'] != self::DOCUMENT);
		if (!$replacesDocument) {
			Logger::info('Media already exists', ['uri-id' => $uriId, 'url' => $url, 'callstack' => System::callstack()]);
			return;
		}
	}

	$media = self::unsetEmptyFields($media);

	// We are storing as fast as possible to avoid duplicated network requests
	// when fetching additional information for pictures and other content.
	$result = DBA::insert('post-media', $media, Database::INSERT_UPDATE);
	Logger::info('Stored media', ['result' => $result, 'media' => $media, 'callstack' => System::callstack()]);
	$initial = $media;

	$media = self::unsetEmptyFields(self::fetchAdditionalData($media));

	if (!array_diff_assoc($media, $initial)) {
		Logger::info('Nothing to update', ['media' => $media]);
		return;
	}

	$result = DBA::insert('post-media', $media, Database::INSERT_UPDATE);
	Logger::info('Updated media', ['result' => $result, 'media' => $media]);
}
|
|
|
|
|
2021-04-14 15:12:01 -04:00
|
|
|
/**
 * Drop the optional media fields that carry no value
 *
 * Only a fixed list of optional fields is inspected, all other fields
 * are passed through untouched.
 *
 * @param array $media
 * @return array media array without the empty optional fields
 */
private static function unsetEmptyFields(array $media)
{
	$optional = ['mimetype', 'height', 'width', 'size', 'preview', 'preview-height', 'preview-width', 'description'];

	foreach ($optional as $key) {
		if (!empty($media[$key])) {
			continue;
		}

		unset($media[$key]);
	}

	return $media;
}
|
|
|
|
|
2020-11-07 03:22:59 -05:00
|
|
|
/**
 * Duplicate all media records of one uri-id for another uri-id
 *
 * Every record is passed through insert(), so the checks of that
 * method apply to each copied record.
 *
 * @param integer $from_uri_id uri-id the records are read from
 * @param integer $to_uri_id   uri-id the records are stored for
 * @return void
 */
public static function copy(int $from_uri_id, int $to_uri_id)
{
	foreach (self::getByURIId($from_uri_id) as $record) {
		$record['uri-id'] = $to_uri_id;
		self::insert($record);
	}
}
|
|
|
|
|
2020-10-31 09:26:08 -04:00
|
|
|
/**
 * Build the "[attach]" element for the given attributes
 *
 * The attributes are run through fetchAdditionalData() first, so the
 * element contains the values that this method returns.
 *
 * @param string  $href   Link to the attached file
 * @param integer $length Size of the attached file
 * @param string  $type   Mimetype of the attached file
 * @param string  $title  Optional title
 * @return string "[attach]" element
 */
public static function getAttachElement(string $href, int $length, string $type, string $title = '')
{
	$document = [
		'type'        => self::DOCUMENT,
		'url'         => $href,
		'size'        => $length,
		'mimetype'    => $type,
		'description' => $title,
	];
	$document = self::fetchAdditionalData($document);

	$element  = '[attach]href="' . $document['url'];
	$element .= '" length="' . $document['size'];
	$element .= '" type="' . $document['mimetype'];
	$element .= '" title="' . $document['description'] . '"[/attach]';

	return $element;
}
|
|
|
|
|
|
|
|
/**
 * Complete a media array with data that is fetched from the media url
 *
 * - A HEAD request provides mimetype and size when one of them is missing.
 * - For images the image information (mimetype, size, dimensions) is fetched,
 *   the same is done for the dimensions of a given preview picture.
 * - Unless the media is a document, the type is detected from the mimetype.
 * - For HTML pages the site information is fetched and copied to the media fields.
 *
 * @param array $media
 * @return array media array with additional data
 */
public static function fetchAdditionalData(array $media)
{
	// Fetch the mimetype or size if missing.
	$needsMimetype = empty($media['mimetype']);
	$needsSize     = empty($media['size']);

	if ($needsMimetype || $needsSize) {
		$timeout = DI::config()->get('system', 'xrd_timeout');
		$head    = DI::httpRequest()->head($media['url'], ['timeout' => $timeout]);

		if (!$head->isSuccess()) {
			Logger::notice('Could not fetch head', ['media' => $media]);
		} else {
			if ($needsMimetype) {
				$media['mimetype'] = $head->getHeader('Content-Type');
			}
			if ($needsSize) {
				$media['size'] = (int)$head->getHeader('Content-Length');
			}
		}
	}

	// The part of the mimetype in front of the slash, empty when no mimetype is known
	$filetype = '';
	if (!empty($media['mimetype'])) {
		$filetype = strtolower(current(explode('/', $media['mimetype'])));
	}

	if (($media['type'] == self::IMAGE) || ($filetype == 'image')) {
		$info = Images::getInfoFromURLCached($media['url']);
		if (empty($info)) {
			Logger::notice('No image data', ['media' => $media]);
		} else {
			$media['mimetype'] = $info['mime'];
			$media['size']     = $info['size'];
			$media['width']    = $info[0];
			$media['height']   = $info[1];
		}

		if (!empty($media['preview'])) {
			$previewInfo = Images::getInfoFromURLCached($media['preview']);
			if (!empty($previewInfo)) {
				$media['preview-width']  = $previewInfo[0];
				$media['preview-height'] = $previewInfo[1];
			}
		}
	}

	// Documents keep their type, everything else gets the type that matches the mimetype
	if ($media['type'] != self::DOCUMENT) {
		$media = self::addType($media);
	}

	if ($media['type'] != self::HTML) {
		return $media;
	}

	$siteinfo = ParseUrl::getSiteinfoCached($media['url'], false);

	// The first image of the page is used as preview
	$media['preview']        = $siteinfo['images'][0]['src'] ?? null;
	$media['preview-height'] = $siteinfo['images'][0]['height'] ?? null;
	$media['preview-width']  = $siteinfo['images'][0]['width'] ?? null;

	// media field => site information field
	$fieldMap = [
		'description'     => 'text',
		'name'            => 'title',
		'author-url'      => 'author_url',
		'author-name'     => 'author_name',
		'author-image'    => 'author_img',
		'publisher-url'   => 'publisher_url',
		'publisher-name'  => 'publisher_name',
		'publisher-image' => 'publisher_img',
	];
	foreach ($fieldMap as $field => $source) {
		$media[$field] = $siteinfo[$source] ?? null;
	}

	return $media;
}
|
|
|
|
|
2021-04-14 15:12:01 -04:00
|
|
|
/**
 * Set the "type" field according to the "mimetype" field
 *
 * The array is returned unchanged when there is no mimetype. A mimetype
 * without a slash or with an unhandled main type results in the type UNKNOWN.
 *
 * @param array $data
 * @return array data array with the detected type
 */
public static function addType(array $data)
{
	if (empty($data['mimetype'])) {
		Logger::info('No MimeType provided', ['media' => $data]);
		return $data;
	}

	// Parameters behind a semicolon (like the charset) are ignored
	$parts = explode('/', current(explode(';', $data['mimetype'])));
	if (count($parts) < 2) {
		Logger::info('Unknown MimeType', ['type' => $parts, 'media' => $data]);
		$data['type'] = self::UNKNOWN;
		return $data;
	}

	$filetype = strtolower($parts[0]);
	$subtype  = strtolower($parts[1]);

	// Type per main type, used when there is no dedicated type for the subtype
	$generic = [
		'image'       => self::IMAGE,
		'video'       => self::VIDEO,
		'audio'       => self::AUDIO,
		'text'        => self::TEXT,
		'application' => self::APPLICATION,
	];

	// Subtypes that have got their own type
	$dedicated = [
		'text'        => ['html' => self::HTML, 'xml' => self::XML, 'plain' => self::PLAIN],
		'application' => ['x-bittorrent' => self::TORRENT],
	];

	if (!isset($generic[$filetype])) {
		$data['type'] = self::UNKNOWN;
		Logger::info('Unknown type', ['filetype' => $filetype, 'subtype' => $subtype, 'media' => $data]);
		return $data;
	}

	$data['type'] = $dedicated[$filetype][$subtype] ?? $generic[$filetype];

	Logger::debug('Detected type', ['filetype' => $filetype, 'subtype' => $subtype, 'media' => $data]);
	return $data;
}
|
|
|
|
|
2020-10-29 01:20:26 -04:00
|
|
|
/**
 * Tests for path patterns that are used for picture links in Friendica
 *
 * Both the page link and the preview link have to match their pattern.
 *
 * @param string $page    Link to the image page
 * @param string $preview Preview picture
 * @return boolean
 */
private static function isPictureLink(string $page, string $preview)
{
	if (!preg_match('#/photos/.*/image/#ism', $page)) {
		return false;
	}

	return (bool)preg_match('#/photo/.*-1\.#ism', $preview);
}
|
|
|
|
|
|
|
|
/**
 * Add media links and remove them from the body
 *
 * All picture, audio and video elements are removed from the body. Only
 * the elements that are found outside of a "real" reshare (a share element
 * with a guid) are stored as media records.
 *
 * @param integer $uriid
 * @param string  $body
 * @return string Body without media links
 */
public static function insertFromBody(int $uriid, string $body)
{
	// Simplify image codes. preg_replace returns null on error, in that case the body is kept as it is.
	$body = preg_replace("/\[img\=([0-9]*)x([0-9]*)\](.*?)\[\/img\]/ism", '[img]$3[/img]', $body) ?? $body;
	$unshared_body = $body;

	// Only remove the shared data from "real" reshares
	$shared = BBCode::fetchShareAttributes($body);
	if (!empty($shared['guid'])) {
		$unshared_body = preg_replace("/\s*\[share .*?\].*?\[\/share\]\s*/ism", '', $body) ?? $body;
	}

	$attachments = [];

	// Friendica picture links with a description: [url=page][img=preview]description[/img][/url]
	if (preg_match_all("#\[url=([^\]]+?)\]\s*\[img=([^\[\]]*)\]([^\[\]]*)\[\/img\]\s*\[/url\]#ism", $body, $pictures, PREG_SET_ORDER)) {
		foreach ($pictures as $picture) {
			if (!self::isPictureLink($picture[1], $picture[2])) {
				continue;
			}
			$body = str_replace($picture[0], '', $body);
			// The url of the full size picture is derived from the url of the preview picture
			$image = str_replace('-1.', '-0.', $picture[2]);
			$attachments[$image] = ['uri-id' => $uriid, 'type' => self::IMAGE, 'url' => $image,
				'preview' => $picture[2], 'description' => $picture[3]];
		}
	}

	// Pictures with a description: [img=url]description[/img]
	if (preg_match_all("/\[img=([^\[\]]*)\]([^\[\]]*)\[\/img\]/Usi", $body, $pictures, PREG_SET_ORDER)) {
		foreach ($pictures as $picture) {
			$body = str_replace($picture[0], '', $body);
			$attachments[$picture[1]] = ['uri-id' => $uriid, 'type' => self::IMAGE, 'url' => $picture[1], 'description' => $picture[2]];
		}
	}

	// Friendica picture links without a description: [url=page][img]preview[/img][/url]
	if (preg_match_all("#\[url=([^\]]+?)\]\s*\[img\]([^\[]+?)\[/img\]\s*\[/url\]#ism", $body, $pictures, PREG_SET_ORDER)) {
		foreach ($pictures as $picture) {
			if (!self::isPictureLink($picture[1], $picture[2])) {
				continue;
			}
			$body = str_replace($picture[0], '', $body);
			$image = str_replace('-1.', '-0.', $picture[2]);
			$attachments[$image] = ['uri-id' => $uriid, 'type' => self::IMAGE, 'url' => $image,
				'preview' => $picture[2], 'description' => null];
		}
	}

	// Pictures without a description: [img]url[/img]
	if (preg_match_all("/\[img\]([^\[\]]*)\[\/img\]/ism", $body, $pictures, PREG_SET_ORDER)) {
		foreach ($pictures as $picture) {
			$body = str_replace($picture[0], '', $body);
			$attachments[$picture[1]] = ['uri-id' => $uriid, 'type' => self::IMAGE, 'url' => $picture[1]];
		}
	}

	if (preg_match_all("/\[audio\]([^\[\]]*)\[\/audio\]/ism", $body, $audios, PREG_SET_ORDER)) {
		foreach ($audios as $audio) {
			$body = str_replace($audio[0], '', $body);
			$attachments[$audio[1]] = ['uri-id' => $uriid, 'type' => self::AUDIO, 'url' => $audio[1]];
		}
	}

	if (preg_match_all("/\[video\]([^\[\]]*)\[\/video\]/ism", $body, $videos, PREG_SET_ORDER)) {
		foreach ($videos as $video) {
			$body = str_replace($video[0], '', $body);
			$attachments[$video[1]] = ['uri-id' => $uriid, 'type' => self::VIDEO, 'url' => $video[1]];
		}
	}

	foreach ($attachments as $attachment) {
		// For picture links the "url" is the derived full size url, which normally isn't part of the body.
		// So we have to look for the preview url, since this is the one that had been embedded.
		$needle = $attachment['preview'] ?? $attachment['url'];
		if ($needle === '') {
			// Empty elements like "[img][/img]" carry nothing that could be stored
			continue;
		}

		// Only store attachments that are part of the unshared body
		if (strpos($unshared_body, $needle) !== false) {
			self::insert($attachment);
		}
	}

	return trim($body);
}
|
2020-10-31 09:26:08 -04:00
|
|
|
|
2021-05-04 01:18:03 -04:00
|
|
|
/**
 * Store the links of the body as media records of unknown type
 *
 * The content of "real" reshares (share elements with a guid) and the
 * links of hashtags and mentions are not taken into account.
 *
 * @param integer $uriid
 * @param string  $body
 * @return void
 */
public static function insertFromRelevantUrl(int $uriid, string $body)
{
	// Only remove the shared data from "real" reshares
	$shared = BBCode::fetchShareAttributes($body);
	if (!empty($shared['guid'])) {
		// Don't look at the shared content
		$body = preg_replace("/\s*\[share .*?\].*?\[\/share\]\s*/ism", '', $body);
	}

	// Remove all hashtags and mentions
	$body = preg_replace("/([#@!])\[url\=(.*?)\](.*?)\[\/url\]/ism", '', $body);

	// Log message => search pattern. Pure links are processed before links with descriptions.
	$searches = [
		'Got page url (link without description)' => "/\[url\](https?:.*?)\[\/url\]/ism",
		'Got page url (link with description)'    => "/\[url\=(https?:.*?)\].*?\[\/url\]/ism",
	];

	foreach ($searches as $message => $pattern) {
		if (!preg_match_all($pattern, $body, $matches)) {
			continue;
		}

		foreach ($matches[1] as $url) {
			Logger::info($message, ['uri-id' => $uriid, 'url' => $url]);
			self::insert(['uri-id' => $uriid, 'type' => self::UNKNOWN, 'url' => $url]);
		}
	}
}
|
|
|
|
|
2021-04-26 02:50:12 -04:00
|
|
|
/**
 * Store the attachment data of the body as media record of the type HTML
 *
 * Shared content is removed before the attachment data is extracted.
 *
 * @param integer $uriid
 * @param string  $body
 * @return void
 */
public static function insertFromAttachmentData(int $uriid, string $body)
{
	// Don't look at the shared content
	$body = preg_replace("/\s*\[share .*?\].*?\[\/share\]\s*/ism", '', $body);

	$data = BBCode::getAttachmentData($body);
	if (empty($data)) {
		return;
	}

	Logger::info('Adding attachment data', ['data' => $data]);

	// A given image takes precedence over the preview
	$preview = $data['preview'] ?? null;
	if (!empty($data['image'])) {
		$preview = $data['image'];
	}

	self::insert([
		'uri-id'         => $uriid,
		'type'           => self::HTML,
		'url'            => $data['url'],
		'preview'        => $preview,
		'description'    => $data['description'] ?? null,
		'name'           => $data['title'] ?? null,
		'author-url'     => $data['author_url'] ?? null,
		'author-name'    => $data['author_name'] ?? null,
		'publisher-url'  => $data['provider_url'] ?? null,
		'publisher-name' => $data['provider_name'] ?? null,
	]);
}
|
|
|
|
|
2020-10-31 09:26:08 -04:00
|
|
|
/**
 * Store the "[attach]" elements of the attach field as document media records
 *
 * @param integer $uriid
 * @param string  $attach Content of the attach field
 * @return void
 */
public static function insertFromAttachment(int $uriid, string $attach)
{
	$pattern = '|\[attach\]href=\"(.*?)\" length=\"(.*?)\" type=\"(.*?)\"(?: title=\"(.*?)\")?|';

	$found = preg_match_all($pattern, $attach, $matches, PREG_SET_ORDER);
	if (!$found) {
		return;
	}

	foreach ($matches as $match) {
		self::insert([
			'type'        => self::DOCUMENT,
			'uri-id'      => $uriid,
			'url'         => $match[1],
			'size'        => $match[2],
			'mimetype'    => $match[3],
			// The title is optional, the group is missing when there is none
			'description' => $match[4] ?? '',
		]);
	}
}
|
2020-10-31 12:10:27 -04:00
|
|
|
|
|
|
|
/**
 * Fetch the media records that are stored for the provided uri-id
 *
 * @param int   $uri_id
 * @param array $types Only fetch records of these types, an empty array fetches all types
 * @return array
 * @throws \Exception
 */
public static function getByURIId(int $uri_id, array $types = [])
{
	$condition = empty($types)
		? ['uri-id' => $uri_id]
		: DBA::mergeConditions(['uri-id' => $uri_id], ['type' => $types]);

	return DBA::selectToArray('post-media', [], $condition);
}
|
2021-04-26 02:50:12 -04:00
|
|
|
|
|
|
|
/**
 * Checks if media records are stored for the provided uri-id
 *
 * @param int   $uri_id
 * @param array $types Only look for records of these types, an empty array looks for all types
 * @return boolean Result of DBA::exists() for the "post-media" table
 * @throws \Exception
 */
public static function existsByURIId(int $uri_id, array $types = [])
{
	if (empty($types)) {
		return DBA::exists('post-media', ['uri-id' => $uri_id]);
	}

	return DBA::exists('post-media', DBA::mergeConditions(['uri-id' => $uri_id], ['type' => $types]));
}
|
|
|
|
|
|
|
|
/**
 * Split the attachment media in the three segments "visual", "link" and "additional"
 *
 * - "link" contains the HTML pages.
 * - "visual" contains images, audio files and videos.
 * - "additional" contains everything else.
 *
 * When a guid is provided, all videos that contain this guid in their url are
 * handled as resolution variants of a single video: one of them is added to
 * "visual", the others are added to "additional".
 *
 * @param int    $uri_id
 * @param string $guid  Optional guid of the post, an empty guid disables the handling of video variants
 * @param array  $links List of links that shouldn't be added
 * @return array attachments
 */
public static function splitAttachments(int $uri_id, string $guid = '', array $links = [])
{
	$attachments = ['visual' => [], 'link' => [], 'additional' => []];

	$media = self::getByURIId($uri_id);
	if (empty($media)) {
		return $attachments;
	}

	$height   = 0;
	$selected = '';
	$previews = [];
	$video    = [];

	foreach ($media as $medium) {
		foreach ($links as $link) {
			if (Strings::compareLink($link, $medium['url'])) {
				continue 2;
			}
		}

		// Avoid adding separate media entries for previews
		foreach ($previews as $preview) {
			if (Strings::compareLink($preview, $medium['url'])) {
				continue 2;
			}
		}

		if (!empty($medium['preview'])) {
			$previews[] = $medium['preview'];
		}

		// A missing mimetype is handled like an empty one and ends up as unknown type
		$type = explode('/', current(explode(';', $medium['mimetype'] ?? '')));
		if (count($type) < 2) {
			Logger::info('Unknown MimeType', ['type' => $type, 'media' => $medium]);
			$filetype = 'unkn';
			$subtype  = 'unkn';
		} else {
			$filetype = strtolower($type[0]);
			$subtype  = strtolower($type[1]);
		}

		$medium['filetype'] = $filetype;
		$medium['subtype']  = $subtype;

		if ($medium['type'] == self::HTML || (($filetype == 'text') && ($subtype == 'html'))) {
			$attachments['link'][] = $medium;
			continue;
		}

		if (in_array($medium['type'], [self::AUDIO, self::IMAGE]) ||
			in_array($filetype, ['audio', 'image'])) {
			$attachments['visual'][] = $medium;
		} elseif (($medium['type'] == self::VIDEO) || ($filetype == 'video')) {
			// An empty guid must never match: strpos() with an empty needle raises a warning
			// on PHP 7 and matches every url on PHP 8.
			if (($guid !== '') && (strpos($medium['url'], $guid) !== false)) {
				// Peertube videos are delivered in many different resolutions. We pick a moderate one.
				// By checking against the GUID we also ensure to only work this way on Peertube posts.
				// This wouldn't be executed when someone for example on Mastodon was sharing multiple videos in a single post.
				if (empty($height) || (($height > $medium['height']) && ($medium['height'] >= 480))) {
					$height   = $medium['height'];
					$selected = $medium['url'];
				}
				$video[$medium['url']] = $medium;
			} else {
				$attachments['visual'][] = $medium;
			}
		} else {
			$attachments['additional'][] = $medium;
		}
	}

	// The selected resolution is the visual one, the other resolutions are additional attachments
	if (!empty($selected)) {
		$attachments['visual'][] = $video[$selected];
		unset($video[$selected]);
		foreach ($video as $element) {
			$attachments['additional'][] = $element;
		}
	}

	return $attachments;
}
|
2021-04-29 17:05:22 -04:00
|
|
|
|
|
|
|
/**
 * Append the stored image, audio and video attachments to the body
 *
 * Media that is already linked in the body is skipped. An "[attachment]"
 * element of the original body is moved behind the appended media.
 *
 * @param int    $uriid
 * @param string $body Body to work on. When empty, the body of the post with the given uri-id is fetched
 * @return string body, empty when the body had to be fetched but no post was found
 */
public static function addAttachmentsToBody(int $uriid, string $body = '')
{
	if (empty($body)) {
		$item = Post::selectFirst(['body'], ['uri-id' => $uriid]);
		if (!DBA::isResult($item)) {
			return '';
		}
		$body = $item['body'];
	}

	$original_body = $body;

	// The attachment element is cut out here and appended again at the end
	$body = preg_replace("/\s*\[attachment .*?\].*?\[\/attachment\]\s*/ism", '', $body);

	foreach (self::getByURIId($uriid, [self::IMAGE, self::AUDIO, self::VIDEO]) as $media) {
		if (Item::containsLink($body, $media['url'])) {
			continue;
		}

		switch ($media['type']) {
			case self::IMAGE:
				$hasPreview     = !empty($media['preview']);
				$hasDescription = !empty($media['description']);

				if ($hasPreview && $hasDescription) {
					$body .= "\n[url=" . $media['url'] . "][img=" . $media['preview'] . ']' . $media['description'] .'[/img][/url]';
				} elseif ($hasPreview) {
					$body .= "\n[url=" . $media['url'] . "][img]" . $media['preview'] .'[/img][/url]';
				} elseif ($hasDescription) {
					$body .= "\n[img=" . $media['url'] . ']' . $media['description'] .'[/img]';
				} else {
					$body .= "\n[img]" . $media['url'] .'[/img]';
				}
				break;

			case self::AUDIO:
				$body .= "\n[audio]" . $media['url'] . "[/audio]\n";
				break;

			case self::VIDEO:
				$body .= "\n[video]" . $media['url'] . "[/video]\n";
				break;
		}
	}

	if (preg_match("/.*(\[attachment.*?\].*?\[\/attachment\]).*/ism", $original_body, $match)) {
		$body .= "\n" . $match[1];
	}

	return $body;
}
|
2020-10-29 01:20:26 -04:00
|
|
|
}
|