]> git.mxchange.org Git - friendica.git/blob - src/Model/Post/Media.php
ab17789724f250f3cf0b37c2fb2a2340273cd653
[friendica.git] / src / Model / Post / Media.php
1 <?php
2 /**
3  * @copyright Copyright (C) 2010-2023, the Friendica project
4  *
5  * @license GNU AGPL version 3 or any later version
6  *
7  * This program is free software: you can redistribute it and/or modify
8  * it under the terms of the GNU Affero General Public License as
9  * published by the Free Software Foundation, either version 3 of the
10  * License, or (at your option) any later version.
11  *
12  * This program is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15  * GNU Affero General Public License for more details.
16  *
17  * You should have received a copy of the GNU Affero General Public License
18  * along with this program.  If not, see <https://www.gnu.org/licenses/>.
19  *
20  */
21
22 namespace Friendica\Model\Post;
23
24 use Friendica\Content\PageInfo;
25 use Friendica\Content\Text\BBCode;
26 use Friendica\Core\Logger;
27 use Friendica\Core\Protocol;
28 use Friendica\Core\System;
29 use Friendica\Database\Database;
30 use Friendica\Database\DBA;
31 use Friendica\DI;
32 use Friendica\Model\Contact;
33 use Friendica\Model\Item;
34 use Friendica\Model\ItemURI;
35 use Friendica\Model\Photo;
36 use Friendica\Model\Post;
37 use Friendica\Network\HTTPClient\Client\HttpClientAccept;
38 use Friendica\Network\HTTPClient\Client\HttpClientOptions;
39 use Friendica\Util\Images;
40 use Friendica\Util\Network;
41 use Friendica\Util\ParseUrl;
42 use Friendica\Util\Proxy;
43 use Friendica\Util\Strings;
44
45 /**
46  * Class Media
47  *
48  * This Model class handles media interactions.
49  * This table stores media (images, videos, audio files) related to posts.
50  */
51 class Media
52 {
        // Generic media types. addType() assigns IMAGE, VIDEO, AUDIO, TEXT and APPLICATION
        // from the primary part of the MIME type and UNKNOWN when it cannot classify it.
        const UNKNOWN     = 0;
        const IMAGE       = 1;
        const VIDEO       = 2;
        const AUDIO       = 3;
        const TEXT        = 4;
        const APPLICATION = 5;
        // Types that addType() derives from a specific MIME subtype
        const TORRENT     = 16;
        const HTML        = 17;
        const XML         = 18;
        const PLAIN       = 19;
        // Set by addActivity() and addAccount() when the media url leads to a post or a contact
        const ACTIVITY    = 20;
        const ACCOUNT     = 21;
        // Lowest priority: insert() lets an entry of any other type replace a stored DOCUMENT with the same url
        const DOCUMENT    = 128;
66
67         /**
68          * Insert a post-media record
69          *
70          * @param array $media
71          * @param bool  $force
72          * @return bool
73          */
74         public static function insert(array $media, bool $force = false): bool
75         {
76                 if (empty($media['url']) || empty($media['uri-id']) || !isset($media['type'])) {
77                         Logger::warning('Incomplete media data', ['media' => $media]);
78                         return false;
79                 }
80
81                 if (DBA::exists('post-media', ['uri-id' => $media['uri-id'], 'preview' => $media['url']])) {
82                         Logger::info('Media already exists as preview', ['uri-id' => $media['uri-id'], 'url' => $media['url'], 'callstack' => System::callstack()]);
83                         return false;
84                 }
85
86                 // "document" has got the lowest priority. So when the same file is both attached as document
87                 // and embedded as picture then we only store the picture or replace the document
88                 $found = DBA::selectFirst('post-media', ['type'], ['uri-id' => $media['uri-id'], 'url' => $media['url']]);
89                 if (!$force && !empty($found) && (($found['type'] != self::DOCUMENT) || ($media['type'] == self::DOCUMENT))) {
90                         Logger::info('Media already exists', ['uri-id' => $media['uri-id'], 'url' => $media['url'], 'callstack' => System::callstack()]);
91                         return false;
92                 }
93
94                 if (!ItemURI::exists($media['uri-id'])) {
95                         Logger::info('Media referenced URI ID not found', ['uri-id' => $media['uri-id'], 'url' => $media['url'], 'callstack' => System::callstack()]);
96                         return false;
97                 }
98
99                 $media = self::unsetEmptyFields($media);
100                 $media = DI::dbaDefinition()->truncateFieldsForTable('post-media', $media);
101
102                 // We are storing as fast as possible to avoid duplicated network requests
103                 // when fetching additional information for pictures and other content.
104                 $result = DBA::insert('post-media', $media, Database::INSERT_UPDATE);
105                 Logger::info('Stored media', ['result' => $result, 'media' => $media, 'callstack' => System::callstack()]);
106                 $stored = $media;
107
108                 $media = self::fetchAdditionalData($media);
109                 $media = self::unsetEmptyFields($media);
110                 $media = DI::dbaDefinition()->truncateFieldsForTable('post-media', $media);
111
112                 if (array_diff_assoc($media, $stored)) {
113                         $result = DBA::insert('post-media', $media, Database::INSERT_UPDATE);
114                         Logger::info('Updated media', ['result' => $result, 'media' => $media]);
115                 } else {
116                         Logger::info('Nothing to update', ['media' => $media]);
117                 }
118                 return $result;
119         }
120
121         /**
122          * Remove empty media fields
123          *
124          * @param array $media
125          * @return array cleaned media array
126          */
127         private static function unsetEmptyFields(array $media): array
128         {
129                 $fields = ['mimetype', 'height', 'width', 'size', 'preview', 'preview-height', 'preview-width', 'blurhash', 'description'];
130                 foreach ($fields as $field) {
131                         if (empty($media[$field])) {
132                                 unset($media[$field]);
133                         }
134                 }
135                 return $media;
136         }
137
138         /**
139          * Copy attachments from one uri-id to another
140          *
141          * @param integer $from_uri_id
142          * @param integer $to_uri_id
143          * @return void
144          */
145         public static function copy(int $from_uri_id, int $to_uri_id)
146         {
147                 $attachments = self::getByURIId($from_uri_id);
148                 foreach ($attachments as $attachment) {
149                         $attachment['uri-id'] = $to_uri_id;
150                         self::insert($attachment);
151                 }
152         }
153
154         /**
155          * Creates the "[attach]" element from the given attributes
156          *
157          * @param string $href
158          * @param integer $length
159          * @param string $type
160          * @param string $title
161          * @return string "[attach]" element
162          */
163         public static function getAttachElement(string $href, int $length, string $type, string $title = ''): string
164         {
165                 $media = self::fetchAdditionalData([
166                         'type' => self::DOCUMENT, 'url' => $href,
167                         'size' => $length, 'mimetype' => $type, 'description' => $title
168                 ]);
169
170                 return '[attach]href="' . $media['url'] . '" length="' . $media['size'] .
171                         '" type="' . $media['mimetype'] . '" title="' . $media['description'] . '"[/attach]';
172         }
173
174         /**
175          * Fetch additional data for the provided media array
176          *
177          * @param array $media
178          * @return array media array with additional data
179          */
180         public static function fetchAdditionalData(array $media): array
181         {
182                 if (Network::isLocalLink($media['url'])) {
183                         $media = self::fetchLocalData($media);
184                 }
185
186                 // Fetch the mimetype or size if missing.
187                 if (Network::isValidHttpUrl($media['url']) && (empty($media['mimetype']) || empty($media['size']))) {
188                         $timeout = DI::config()->get('system', 'xrd_timeout');
189                         $curlResult = DI::httpClient()->head($media['url'], [HttpClientOptions::TIMEOUT => $timeout]);
190
191                         // Workaround for systems that can't handle a HEAD request
192                         if (!$curlResult->isSuccess() && ($curlResult->getReturnCode() == 405)) {
193                                 $curlResult = DI::httpClient()->get($media['url'], HttpClientAccept::DEFAULT, [HttpClientOptions::TIMEOUT => $timeout]);
194                         }
195
196                         if ($curlResult->isSuccess()) {
197                                 if (empty($media['mimetype'])) {
198                                         $media['mimetype'] = $curlResult->getHeader('Content-Type')[0] ?? '';
199                                 }
200                                 if (empty($media['size'])) {
201                                         $media['size'] = (int)($curlResult->getHeader('Content-Length')[0] ?? 0);
202                                 }
203                         } else {
204                                 Logger::notice('Could not fetch head', ['media' => $media]);
205                         }
206                 }
207
208                 $filetype = !empty($media['mimetype']) ? strtolower(current(explode('/', $media['mimetype']))) : '';
209
210                 if (($media['type'] == self::IMAGE) || ($filetype == 'image')) {
211                         $imagedata = Images::getInfoFromURLCached($media['url']);
212                         if ($imagedata) {
213                                 $media['mimetype'] = $imagedata['mime'];
214                                 $media['size'] = $imagedata['size'];
215                                 $media['width'] = $imagedata[0];
216                                 $media['height'] = $imagedata[1];
217                                 $media['blurhash'] = $imagedata['blurhash'] ?? null;
218                         } else {
219                                 Logger::notice('No image data', ['media' => $media]);
220                         }
221                         if (!empty($media['preview'])) {
222                                 $imagedata = Images::getInfoFromURLCached($media['preview']);
223                                 if ($imagedata) {
224                                         $media['preview-width'] = $imagedata[0];
225                                         $media['preview-height'] = $imagedata[1];
226                                 }
227                         }
228                 }
229
230                 if ($media['type'] != self::DOCUMENT) {
231                         $media = self::addType($media);
232                 }
233
234                 if (in_array($media['type'], [self::TEXT, self::APPLICATION, self::HTML, self::XML, self::PLAIN])) {
235                         $media = self::addActivity($media);
236                 }
237
238                 if (in_array($media['type'], [self::TEXT, self::APPLICATION, self::HTML, self::XML, self::PLAIN])) {
239                         $media = self::addAccount($media);
240                 }
241
242                 if ($media['type'] == self::HTML) {
243                         $media = self::addPage($media);
244                 }
245
246                 return $media;
247         }
248
249         /**
250          * Adds the activity type if the media entry is linked to an activity
251          *
252          * @param array $media
253          * @return array
254          */
255         private static function addActivity(array $media): array
256         {
257                 $id = Item::fetchByLink($media['url']);
258                 if (empty($id)) {
259                         return $media;
260                 }
261
262                 $item = Post::selectFirst([], ['id' => $id, 'network' => Protocol::FEDERATED]);
263                 if (empty($item['id'])) {
264                         Logger::debug('Not a federated activity', ['id' => $id, 'uri-id' => $media['uri-id'], 'url' => $media['url']]);
265                         return $media;
266                 }
267
268                 if (
269                         !empty($item['plink']) && Strings::compareLink($item['plink'], $media['url']) &&
270                         parse_url($item['plink'], PHP_URL_HOST) != parse_url($item['uri'], PHP_URL_HOST)
271                 ) {
272                         Logger::debug('Not a link to an activity', ['uri-id' => $media['uri-id'], 'url' => $media['url'], 'plink' => $item['plink'], 'uri' => $item['uri']]);
273                         return $media;
274                 }
275
276                 if (in_array($item['network'], [Protocol::ACTIVITYPUB, Protocol::DFRN])) {
277                         $media['mimetype'] = 'application/activity+json';
278                 } elseif ($item['network'] == Protocol::DIASPORA) {
279                         $media['mimetype'] = 'application/xml';
280                 }
281
282                 $contact = Contact::getById($item['author-id'], ['avatar', 'gsid']);
283                 if (!empty($contact['gsid'])) {
284                         $gserver = DBA::selectFirst('gserver', ['url', 'site_name'], ['id' => $contact['gsid']]);
285                 }
286
287                 $media['type'] = self::ACTIVITY;
288                 $media['media-uri-id'] = $item['uri-id'];
289                 $media['height'] = null;
290                 $media['width'] = null;
291                 $media['preview'] = null;
292                 $media['preview-height'] = null;
293                 $media['preview-width'] = null;
294                 $media['blurhash'] = null;
295                 $media['description'] = $item['body'];
296                 $media['name'] = $item['title'];
297                 $media['author-url'] = $item['author-link'];
298                 $media['author-name'] = $item['author-name'];
299                 $media['author-image'] = $contact['avatar'] ?? $item['author-avatar'];
300                 $media['publisher-url'] = $gserver['url'] ?? null;
301                 $media['publisher-name'] = $gserver['site_name'] ?? null;
302                 $media['publisher-image'] = null;
303
304                 Logger::debug('Activity detected', ['uri-id' => $media['uri-id'], 'url' => $media['url'], 'plink' => $item['plink'], 'uri' => $item['uri']]);
305                 return $media;
306         }
307
308         /**
309          * Adds the account type if the media entry is linked to an account
310          *
311          * @param array $media
312          * @return array
313          */
314         private static function addAccount(array $media): array
315         {
316                 $contact = Contact::getByURL($media['url'], false);
317                 if (empty($contact) || ($contact['network'] == Protocol::PHANTOM)) {
318                         return $media;
319                 }
320
321                 if (in_array($contact['network'], [Protocol::ACTIVITYPUB, Protocol::DFRN])) {
322                         $media['mimetype'] = 'application/activity+json';
323                 }
324
325                 if (!empty($contact['gsid'])) {
326                         $gserver = DBA::selectFirst('gserver', ['url', 'site_name'], ['id' => $contact['gsid']]);
327                 }
328
329                 $media['type'] = self::ACCOUNT;
330                 $media['media-uri-id'] = $contact['uri-id'];
331                 $media['height'] = null;
332                 $media['width'] = null;
333                 $media['preview'] = null;
334                 $media['preview-height'] = null;
335                 $media['preview-width'] = null;
336                 $media['blurhash'] = null;
337                 $media['description'] = $contact['about'];
338                 $media['name'] = $contact['name'];
339                 $media['author-url'] = $contact['url'];
340                 $media['author-name'] = $contact['name'];
341                 $media['author-image'] = $contact['avatar'];
342                 $media['publisher-url'] = $gserver['url'] ?? null;
343                 $media['publisher-name'] = $gserver['site_name'] ?? null;
344                 $media['publisher-image'] = null;
345
346                 Logger::debug('Account detected', ['uri-id' => $media['uri-id'], 'url' => $media['url'], 'uri' => $contact['url']]);
347                 return $media;
348         }
349
350         /**
351          * Add page infos for HTML entries
352          *
353          * @param array $media
354          * @return array
355          */
356         private static function addPage(array $media): array
357         {
358                 $data = ParseUrl::getSiteinfoCached($media['url'], false);
359                 $media['preview'] = $data['images'][0]['src'] ?? null;
360                 $media['preview-height'] = $data['images'][0]['height'] ?? null;
361                 $media['preview-width'] = $data['images'][0]['width'] ?? null;
362                 $media['blurhash'] = $data['images'][0]['blurhash'] ?? null;
363                 $media['description'] = $data['text'] ?? null;
364                 $media['name'] = $data['title'] ?? null;
365                 $media['author-url'] = $data['author_url'] ?? null;
366                 $media['author-name'] = $data['author_name'] ?? null;
367                 $media['author-image'] = $data['author_img'] ?? null;
368                 $media['publisher-url'] = $data['publisher_url'] ?? null;
369                 $media['publisher-name'] = $data['publisher_name'] ?? null;
370                 $media['publisher-image'] = $data['publisher_img'] ?? null;
371
372                 return $media;
373         }
374
375         /**
376          * Fetch media data from local resources
377          * @param array $media
378          * @return array media with added data
379          */
380         private static function fetchLocalData(array $media): array
381         {
382                 if (!preg_match('|.*?/photo/(.*[a-fA-F0-9])\-(.*[0-9])\..*[\w]|', $media['url'] ?? '', $matches)) {
383                         return $media;
384                 }
385                 $photo = Photo::selectFirst([], ['resource-id' => $matches[1], 'scale' => $matches[2]]);
386                 if (!empty($photo)) {
387                         $media['mimetype'] = $photo['type'];
388                         $media['size'] = $photo['datasize'];
389                         $media['width'] = $photo['width'];
390                         $media['height'] = $photo['height'];
391                         $media['blurhash'] = $photo['blurhash'];
392                 }
393
394                 if (!preg_match('|.*?/photo/(.*[a-fA-F0-9])\-(.*[0-9])\..*[\w]|', $media['preview'] ?? '', $matches)) {
395                         return $media;
396                 }
397                 $photo = Photo::selectFirst([], ['resource-id' => $matches[1], 'scale' => $matches[2]]);
398                 if (!empty($photo)) {
399                         $media['preview-width'] = $photo['width'];
400                         $media['preview-height'] = $photo['height'];
401                 }
402
403                 return $media;
404         }
405
406         /**
407          * Add the detected type to the media array
408          *
409          * @param array $data
410          * @return array data array with the detected type
411          */
412         public static function addType(array $data): array
413         {
414                 if (empty($data['mimetype'])) {
415                         Logger::info('No MimeType provided', ['media' => $data]);
416                         return $data;
417                 }
418
419                 $type = explode('/', current(explode(';', $data['mimetype'])));
420                 if (count($type) < 2) {
421                         Logger::info('Unknown MimeType', ['type' => $type, 'media' => $data]);
422                         $data['type'] = self::UNKNOWN;
423                         return $data;
424                 }
425
426                 $filetype = strtolower($type[0]);
427                 $subtype = strtolower($type[1]);
428
429                 if ($filetype == 'image') {
430                         $data['type'] = self::IMAGE;
431                 } elseif ($filetype == 'video') {
432                         $data['type'] = self::VIDEO;
433                 } elseif ($filetype == 'audio') {
434                         $data['type'] = self::AUDIO;
435                 } elseif (($filetype == 'text') && ($subtype == 'html')) {
436                         $data['type'] = self::HTML;
437                 } elseif (($filetype == 'text') && ($subtype == 'xml')) {
438                         $data['type'] = self::XML;
439                 } elseif (($filetype == 'text') && ($subtype == 'plain')) {
440                         $data['type'] = self::PLAIN;
441                 } elseif ($filetype == 'text') {
442                         $data['type'] = self::TEXT;
443                 } elseif (($filetype == 'application') && ($subtype == 'x-bittorrent')) {
444                         $data['type'] = self::TORRENT;
445                 } elseif ($filetype == 'application') {
446                         $data['type'] = self::APPLICATION;
447                 } else {
448                         $data['type'] = self::UNKNOWN;
449                         Logger::info('Unknown type', ['filetype' => $filetype, 'subtype' => $subtype, 'media' => $data]);
450                         return $data;
451                 }
452
453                 Logger::debug('Detected type', ['filetype' => $filetype, 'subtype' => $subtype, 'media' => $data]);
454                 return $data;
455         }
456
457         /**
458          * Tests for path patterns that are usef for picture links in Friendica
459          *
460          * @param string $page    Link to the image page
461          * @param string $preview Preview picture
462          * @return boolean
463          */
464         private static function isPictureLink(string $page, string $preview): bool
465         {
466                 return preg_match('#/photos/.*/image/#ism', $page) && preg_match('#/photo/.*-1\.#ism', $preview);
467         }
468
469         /**
470          * Add media links and remove them from the body
471          *
472          * @param integer $uriid
473          * @param string $body
474          * @return string Body without media links
475          */
476         public static function insertFromBody(int $uriid, string $body, bool $endmatch = false): string
477         {
478                 $endmatchpattern = $endmatch ? '\z' : '';
479                 // Simplify image codes
480                 $unshared_body = $body = preg_replace("/\[img\=([0-9]*)x([0-9]*)\](.*?)\[\/img\]$endmatchpattern/ism", '[img]$3[/img]', $body);
481
482                 $attachments = [];
483                 if (preg_match_all("#\[url=([^\]]+?)\]\s*\[img=([^\[\]]*)\]([^\[\]]*)\[\/img\]\s*\[/url\]$endmatchpattern#ism", $body, $pictures, PREG_SET_ORDER)) {
484                         foreach ($pictures as $picture) {
485                                 if (!self::isPictureLink($picture[1], $picture[2])) {
486                                         continue;
487                                 }
488                                 $body = str_replace($picture[0], '', $body);
489                                 $image = str_replace('-1.', '-0.', $picture[2]);
490                                 $attachments[$image] = [
491                                         'uri-id' => $uriid, 'type' => self::IMAGE, 'url' => $image,
492                                         'preview' => $picture[2], 'description' => $picture[3]
493                                 ];
494                         }
495                 }
496
497                 if (preg_match_all("/\[img=([^\[\]]*)\]([^\[\]]*)\[\/img\]$endmatchpattern/Usi", $body, $pictures, PREG_SET_ORDER)) {
498                         foreach ($pictures as $picture) {
499                                 $body = str_replace($picture[0], '', $body);
500                                 $attachments[$picture[1]] = ['uri-id' => $uriid, 'type' => self::IMAGE, 'url' => $picture[1], 'description' => $picture[2]];
501                         }
502                 }
503
504                 if (preg_match_all("#\[url=([^\]]+?)\]\s*\[img\]([^\[]+?)\[/img\]\s*\[/url\]$endmatchpattern#ism", $body, $pictures, PREG_SET_ORDER)) {
505                         foreach ($pictures as $picture) {
506                                 if (!self::isPictureLink($picture[1], $picture[2])) {
507                                         continue;
508                                 }
509                                 $body = str_replace($picture[0], '', $body);
510                                 $image = str_replace('-1.', '-0.', $picture[2]);
511                                 $attachments[$image] = [
512                                         'uri-id' => $uriid, 'type' => self::IMAGE, 'url' => $image,
513                                         'preview' => $picture[2], 'description' => null
514                                 ];
515                         }
516                 }
517
518                 if (preg_match_all("/\[img\]([^\[\]]*)\[\/img\]$endmatchpattern/ism", $body, $pictures, PREG_SET_ORDER)) {
519                         foreach ($pictures as $picture) {
520                                 $body = str_replace($picture[0], '', $body);
521                                 $attachments[$picture[1]] = ['uri-id' => $uriid, 'type' => self::IMAGE, 'url' => $picture[1]];
522                         }
523                 }
524
525                 if (preg_match_all("/\[audio\]([^\[\]]*)\[\/audio\]$endmatchpattern/ism", $body, $audios, PREG_SET_ORDER)) {
526                         foreach ($audios as $audio) {
527                                 $body = str_replace($audio[0], '', $body);
528                                 $attachments[$audio[1]] = ['uri-id' => $uriid, 'type' => self::AUDIO, 'url' => $audio[1]];
529                         }
530                 }
531
532                 if (preg_match_all("/\[video\]([^\[\]]*)\[\/video\]$endmatchpattern/ism", $body, $videos, PREG_SET_ORDER)) {
533                         foreach ($videos as $video) {
534                                 $body = str_replace($video[0], '', $body);
535                                 $attachments[$video[1]] = ['uri-id' => $uriid, 'type' => self::VIDEO, 'url' => $video[1]];
536                         }
537                 }
538
539                 if ($uriid != 0) {
540                         foreach ($attachments as $attachment) {
541                                 if (Post\Link::exists($uriid, $attachment['preview'] ?? $attachment['url'])) {
542                                         continue;
543                                 }
544
545                                 // Only store attachments that are part of the unshared body
546                                 if (Item::containsLink($unshared_body, $attachment['preview'] ?? $attachment['url'], $attachment['type'])) {
547                                         self::insert($attachment);
548                                 }
549                         }
550                 }
551
552                 return trim($body);
553         }
554
555         /**
556          * Remove media that is at the end of the body
557          *
558          * @param string $body
559          * @return string
560          */
561         public static function removeFromEndOfBody(string $body): string
562         {
563                 do {
564                         $prebody = $body;
565                         $body = self::insertFromBody(0, $body, true);
566                 } while ($prebody != $body);
567                 return $body;
568         }
569
570         /**
571          * Add media links from a relevant url in the body
572          *
573          * @param integer $uriid
574          * @param string $body
575          * @return void
576          */
577         public static function insertFromRelevantUrl(int $uriid, string $body, string $fullbody, string $network)
578         {
579                 // Remove all hashtags and mentions
580                 $body = preg_replace("/([#@!])\[url\=(.*?)\](.*?)\[\/url\]/ism", '', $body);
581
582                 // Search for pure links
583                 if (preg_match_all("/\[url\](https?:.*?)\[\/url\]/ism", $body, $matches)) {
584                         foreach ($matches[1] as $url) {
585                                 Logger::info('Got page url (link without description)', ['uri-id' => $uriid, 'url' => $url]);
586                                 $result = self::insert(['uri-id' => $uriid, 'type' => self::UNKNOWN, 'url' => $url], false, $network);
587                                 if ($result && ($network == Protocol::DFRN)) {
588                                         self::revertHTMLType($uriid, $url, $fullbody);
589                                         Logger::debug('Revert HTML type', ['uri-id' => $uriid, 'url' => $url]);
590                                 } elseif ($result) {
591                                         Logger::debug('Media had been added', ['uri-id' => $uriid, 'url' => $url]);
592                                 } else {
593                                         Logger::debug('Media had not been added', ['uri-id' => $uriid, 'url' => $url]);
594                                 }
595                         }
596                 }
597
598                 // Search for links with descriptions
599                 if (preg_match_all("/\[url\=(https?:.*?)\].*?\[\/url\]/ism", $body, $matches)) {
600                         foreach ($matches[1] as $url) {
601                                 Logger::info('Got page url (link with description)', ['uri-id' => $uriid, 'url' => $url]);
602                                 $result = self::insert(['uri-id' => $uriid, 'type' => self::UNKNOWN, 'url' => $url], false, $network);
603                                 if ($result && ($network == Protocol::DFRN)) {
604                                         self::revertHTMLType($uriid, $url, $fullbody);
605                                         Logger::debug('Revert HTML type', ['uri-id' => $uriid, 'url' => $url]);
606                                 } elseif ($result) {
607                                         Logger::debug('Media has been added', ['uri-id' => $uriid, 'url' => $url]);
608                                 } else {
609                                         Logger::debug('Media has not been added', ['uri-id' => $uriid, 'url' => $url]);
610                                 }
611                         }
612                 }
613         }
614
615         /**
616          * Revert the media type of links to UNKNOWN for DFRN posts when they aren't attached
617          *
618          * @param integer $uriid
619          * @param string $url
620          * @param string $body
621          * @return void
622          */
623         private static function revertHTMLType(int $uriid, string $url, string $body)
624         {
625                 $attachment = BBCode::getAttachmentData($body);
626                 if (!empty($attachment['url']) && Network::getUrlMatch($attachment['url'], $url)) {
627                         return;
628                 }
629                 DBA::update('post-media', ['type' => self::UNKNOWN], ['uri-id' => $uriid, 'type' => self::HTML, 'url' => $url]);
630         }
631
632         /**
633          * Add media links from the attachment field
634          *
635          * @param integer $uriid
636          * @param string $body
637          * @return void
638          */
639         public static function insertFromAttachmentData(int $uriid, string $body)
640         {
641                 $data = BBCode::getAttachmentData($body);
642                 if (empty($data)) {
643                         return;
644                 }
645
646                 Logger::info('Adding attachment data', ['data' => $data]);
647                 $attachment = [
648                         'uri-id' => $uriid,
649                         'type' => self::HTML,
650                         'url' => $data['url'],
651                         'preview' => $data['preview'] ?? null,
652                         'description' => $data['description'] ?? null,
653                         'name' => $data['title'] ?? null,
654                         'author-url' => $data['author_url'] ?? null,
655                         'author-name' => $data['author_name'] ?? null,
656                         'publisher-url' => $data['provider_url'] ?? null,
657                         'publisher-name' => $data['provider_name'] ?? null,
658                 ];
659                 if (!empty($data['image'])) {
660                         $attachment['preview'] = $data['image'];
661                 }
662                 self::insert($attachment);
663         }
664
665         /**
666          * Add media links from the attach field
667          *
668          * @param integer $uriid
669          * @param string $attach
670          * @return void
671          */
672         public static function insertFromAttachment(int $uriid, string $attach)
673         {
674                 if (!preg_match_all('|\[attach\]href=\"(.*?)\" length=\"(.*?)\" type=\"(.*?)\"(?: title=\"(.*?)\")?|', $attach, $matches, PREG_SET_ORDER)) {
675                         return;
676                 }
677
678                 foreach ($matches as $attachment) {
679                         $media['type'] = self::DOCUMENT;
680                         $media['uri-id'] = $uriid;
681                         $media['url'] = $attachment[1];
682                         $media['size'] = $attachment[2];
683                         $media['mimetype'] = $attachment[3];
684                         $media['description'] = $attachment[4] ?? '';
685
686                         self::insert($media);
687                 }
688         }
689
690         /**
691          * Retrieves the media attachments associated with the provided item ID.
692          *
693          * @param int $uri_id URI id
694          * @param array $types Media types
695          * @return array|bool Array on success, false on error
696          * @throws \Exception
697          */
698         public static function getByURIId(int $uri_id, array $types = [])
699         {
700                 $condition = ["`uri-id` = ? AND `type` != ?", $uri_id, self::UNKNOWN];
701
702                 if (!empty($types)) {
703                         $condition = DBA::mergeConditions($condition, ['type' => $types]);
704                 }
705
706                 return DBA::selectToArray('post-media', [], $condition, ['order' => ['id']]);
707         }
708
709         /**
710          * Checks if media attachments are associated with the provided item ID.
711          *
712          * @param int $uri_id URI id
713          * @param array $types Media types
714          * @return bool Whether media attachment exists
715          * @throws \Exception
716          */
717         public static function existsByURIId(int $uri_id, array $types = []): bool
718         {
719                 $condition = ["`uri-id` = ? AND `type` != ?", $uri_id, self::UNKNOWN];
720
721                 if (!empty($types)) {
722                         $condition = DBA::mergeConditions($condition, ['type' => $types]);
723                 }
724
725                 return DBA::exists('post-media', $condition);
726         }
727
728         /**
729          * Delete media by uri-id and media type
730          *
731          * @param int $uri_id URI id
732          * @param array $types Media types
733          * @return bool Whether media attachment exists
734          * @throws \Exception
735          */
736         public static function deleteByURIId(int $uri_id, array $types = []): bool
737         {
738                 $condition = ['uri-id' => $uri_id];
739
740                 if (!empty($types)) {
741                         $condition = DBA::mergeConditions($condition, ['type' => $types]);
742                 }
743
744                 return DBA::delete('post-media', $condition);
745         }
746
747         /**
748          * Split the attachment media in the three segments "visual", "link" and "additional"
749          *
750          * @param int    $uri_id URI id
751          * @param array  $links list of links that shouldn't be added
752          * @param bool   $has_media
753          * @return array attachments
754          */
755         public static function splitAttachments(int $uri_id, array $links = [], bool $has_media = true): array
756         {
757                 $attachments = ['visual' => [], 'link' => [], 'additional' => []];
758
759                 if (!$has_media) {
760                         return $attachments;
761                 }
762
763                 $media = self::getByURIId($uri_id);
764                 if (empty($media)) {
765                         return $attachments;
766                 }
767
768                 $heights = [];
769                 $selected = '';
770                 $previews = [];
771
772                 foreach ($media as $medium) {
773                         foreach ($links as $link) {
774                                 if (Strings::compareLink($link, $medium['url'])) {
775                                         continue 2;
776                                 }
777                         }
778
779                         // Avoid adding separate media entries for previews
780                         foreach ($previews as $preview) {
781                                 if (Strings::compareLink($preview, $medium['url'])) {
782                                         continue 2;
783                                 }
784                         }
785
786                         // Currently these two types are ignored here.
787                         // Posts are added differently and contacts are not displayed as attachments.
788                         if (in_array($medium['type'], [self::ACCOUNT, self::ACTIVITY])) {
789                                 continue;
790                         }
791
792                         if (!empty($medium['preview'])) {
793                                 $previews[] = $medium['preview'];
794                         }
795
796                         $type = explode('/', explode(';', $medium['mimetype'] ?? '')[0]);
797                         if (count($type) < 2) {
798                                 Logger::info('Unknown MimeType', ['type' => $type, 'media' => $medium]);
799                                 $filetype = 'unkn';
800                                 $subtype = 'unkn';
801                         } else {
802                                 $filetype = strtolower($type[0]);
803                                 $subtype = strtolower($type[1]);
804                         }
805
806                         $medium['filetype'] = $filetype;
807                         $medium['subtype'] = $subtype;
808
809                         if ($medium['type'] == self::HTML || (($filetype == 'text') && ($subtype == 'html'))) {
810                                 $attachments['link'][] = $medium;
811                                 continue;
812                         }
813
814                         if (
815                                 in_array($medium['type'], [self::AUDIO, self::IMAGE]) ||
816                                 in_array($filetype, ['audio', 'image'])
817                         ) {
818                                 $attachments['visual'][] = $medium;
819                         } elseif (($medium['type'] == self::VIDEO) || ($filetype == 'video')) {
820                                 if (!empty($medium['height'])) {
821                                         // Peertube videos are delivered in many different resolutions. We pick a moderate one.
822                                         // Since only Peertube provides a "height" parameter, this wouldn't be executed
823                                         // when someone for example on Mastodon was sharing multiple videos in a single post.
824                                         $heights[$medium['height']] = $medium['url'];
825                                         $video[$medium['url']] = $medium;
826                                 } else {
827                                         $attachments['visual'][] = $medium;
828                                 }
829                         } else {
830                                 $attachments['additional'][] = $medium;
831                         }
832                 }
833
834                 if (!empty($heights)) {
835                         ksort($heights);
836                         foreach ($heights as $height => $url) {
837                                 if (empty($selected) || $height <= 480) {
838                                         $selected = $url;
839                                 }
840                         }
841
842                         if (!empty($selected)) {
843                                 $attachments['visual'][] = $video[$selected];
844                                 unset($video[$selected]);
845                                 foreach ($video as $element) {
846                                         $attachments['additional'][] = $element;
847                                 }
848                         }
849                 }
850
851                 return $attachments;
852         }
853
854         /**
855          * Add media attachments to the body
856          *
857          * @param int    $uriid
858          * @param string $body
859          * @param array  $types
860          *
861          * @return string body
862          */
863         public static function addAttachmentsToBody(int $uriid, string $body = '', array $types = [self::IMAGE, self::AUDIO, self::VIDEO]): string
864         {
865                 if (empty($body)) {
866                         $item = Post::selectFirst(['body'], ['uri-id' => $uriid]);
867                         if (!DBA::isResult($item)) {
868                                 return '';
869                         }
870                         $body = $item['body'];
871                 }
872                 $original_body = $body;
873
874                 $body = BBCode::removeAttachment($body);
875
876                 foreach (self::getByURIId($uriid, $types) as $media) {
877                         if (Item::containsLink($body, $media['preview'] ?? $media['url'], $media['type'])) {
878                                 continue;
879                         }
880
881                         if ($media['type'] == self::IMAGE) {
882                                 if (!empty($media['preview'])) {
883                                         if (!empty($media['description'])) {
884                                                 $body .= "\n[url=" . $media['url'] . "][img=" . $media['preview'] . ']' . $media['description'] . '[/img][/url]';
885                                         } else {
886                                                 $body .= "\n[url=" . $media['url'] . "][img]" . $media['preview'] . '[/img][/url]';
887                                         }
888                                 } else {
889                                         if (!empty($media['description'])) {
890                                                 $body .= "\n[img=" . $media['url'] . ']' . $media['description'] . '[/img]';
891                                         } else {
892                                                 $body .= "\n[img]" . $media['url'] . '[/img]';
893                                         }
894                                 }
895                         } elseif ($media['type'] == self::AUDIO) {
896                                 $body .= "\n[audio]" . $media['url'] . "[/audio]\n";
897                         } elseif ($media['type'] == self::VIDEO) {
898                                 $body .= "\n[video]" . $media['url'] . "[/video]\n";
899                         }
900                 }
901
902                 if (preg_match("/.*(\[attachment.*?\].*?\[\/attachment\]).*/ism", $original_body, $match)) {
903                         $body .= "\n" . $match[1];
904                 }
905
906                 return $body;
907         }
908
909         /**
910          * Add an [attachment] element to the body for a given uri-id with a HTML media element
911          *
912          * @param integer $uriid
913          * @param string $body
914          * @return string
915          */
916         public static function addHTMLAttachmentToBody(int $uriid, string $body): string
917         {
918                 if (preg_match("/.*(\[attachment.*?\].*?\[\/attachment\]).*/ism", $body, $match)) {
919                         return $body;
920                 }
921
922                 $links = self::getByURIId($uriid, [self::HTML]);
923                 if (empty($links)) {
924                         return $body;
925                 }
926
927                 $data = [
928                         'type' => 'link',
929                         'url'  => $links[0]['url'],
930                         'title' => $links[0]['name'],
931                         'text' => $links[0]['description'],
932                         'publisher_name' => $links[0]['publisher-name'],
933                         'publisher_url' => $links[0]['publisher-url'],
934                         'publisher_img' => $links[0]['publisher-image'],
935                         'author_name' => $links[0]['author-name'],
936                         'author_url' => $links[0]['author-url'],
937                         'author_img' => $links[0]['author-image'],
938                         'images' => [[
939                                 'src' => $links[0]['preview'],
940                                 'height' => $links[0]['preview-height'],
941                                 'width' => $links[0]['preview-width'],
942                         ]]
943                 ];
944                 $body .= "\n" . PageInfo::getFooterFromData($data);
945
946                 return $body;
947         }
948
949         /**
950          * Add a link to the body for a given uri-id with a HTML media element
951          *
952          * @param integer $uriid
953          * @param string $body
954          * @return string
955          */
956         public static function addHTMLLinkToBody(int $uriid, string $body): string
957         {
958                 $links = self::getByURIId($uriid, [self::HTML]);
959                 if (empty($links)) {
960                         return $body;
961                 }
962
963                 if (strpos($body, $links[0]['url'])) {
964                         return $body;
965                 }
966
967                 if (!empty($links[0]['name']) && ($links[0]['name'] != $links[0]['url'])) {
968                         return $body . "\n[url=" . $links[0]['url'] . ']' . $links[0]['name'] . "[/url]";
969                 } else {
970                         return $body . "\n[url]" . $links[0]['url'] . "[/url]";
971                 }
972         }
973
974         /**
975          * Add an [attachment] element to the body and a link to raw-body for a given uri-id with a HTML media element
976          *
977          * @param array $item
978          * @return array
979          */
980         public static function addHTMLAttachmentToItem(array $item): array
981         {
982                 if (($item['gravity'] == Item::GRAVITY_ACTIVITY) || empty($item['uri-id'])) {
983                         return $item;
984                 }
985
986                 $item['body'] = self::addHTMLAttachmentToBody($item['uri-id'], $item['body']);
987
988                 if (!empty($item['raw-body'])) {
989                         $item['raw-body'] = self::addHTMLLinkToBody($item['uri-id'], $item['raw-body']);
990                 }
991
992                 return $item;
993         }
994
995         /**
996          * Get preview link for given media id
997          *
998          * @param integer $id   media id
999          * @param string  $size One of the Proxy::SIZE_* constants
1000          * @return string preview link
1001          */
1002         public static function getPreviewUrlForId(int $id, string $size = ''): string
1003         {
1004                 $url = DI::baseUrl() . '/photo/preview/';
1005                 switch ($size) {
1006                         case Proxy::SIZE_MICRO:
1007                                 $url .= Proxy::PIXEL_MICRO . '/';
1008                                 break;
1009                         case Proxy::SIZE_THUMB:
1010                                 $url .= Proxy::PIXEL_THUMB . '/';
1011                                 break;
1012                         case Proxy::SIZE_SMALL:
1013                                 $url .= Proxy::PIXEL_SMALL . '/';
1014                                 break;
1015                         case Proxy::SIZE_MEDIUM:
1016                                 $url .= Proxy::PIXEL_MEDIUM . '/';
1017                                 break;
1018                         case Proxy::SIZE_LARGE:
1019                                 $url .= Proxy::PIXEL_LARGE . '/';
1020                                 break;
1021                 }
1022                 return $url . $id;
1023         }
1024
1025         /**
1026          * Get media link for given media id
1027          *
1028          * @param integer $id   media id
1029          * @param string  $size One of the Proxy::SIZE_* constants
1030          * @return string media link
1031          */
1032         public static function getUrlForId(int $id, string $size = ''): string
1033         {
1034                 $url = DI::baseUrl() . '/photo/media/';
1035                 switch ($size) {
1036                         case Proxy::SIZE_MICRO:
1037                                 $url .= Proxy::PIXEL_MICRO . '/';
1038                                 break;
1039                         case Proxy::SIZE_THUMB:
1040                                 $url .= Proxy::PIXEL_THUMB . '/';
1041                                 break;
1042                         case Proxy::SIZE_SMALL:
1043                                 $url .= Proxy::PIXEL_SMALL . '/';
1044                                 break;
1045                         case Proxy::SIZE_MEDIUM:
1046                                 $url .= Proxy::PIXEL_MEDIUM . '/';
1047                                 break;
1048                         case Proxy::SIZE_LARGE:
1049                                 $url .= Proxy::PIXEL_LARGE . '/';
1050                                 break;
1051                 }
1052                 return $url . $id;
1053         }
1054 }