friendica/src/Util/JsonLD.php

252 lines
6.6 KiB
PHP
Raw Normal View History

<?php
/**
* @copyright Copyright (C) 2020, Friendica
*
* @license GNU AGPL version 3 or any later version
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as
* published by the Free Software Foundation, either version 3 of the
* License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program. If not, see <https://www.gnu.org/licenses/>.
*
*/
namespace Friendica\Util;
use Friendica\Core\Cache\Duration;
2018-10-29 17:20:46 -04:00
use Friendica\Core\Logger;
2018-09-26 18:45:13 -04:00
use Exception;
use Friendica\DI;
/**
 * This class contains methods to work with JsonLD data
 */
class JsonLD
{
	/**
	 * Loader for LD-JSON validation
	 *
	 * This method is registered as the document loader of the JSON-LD
	 * processor by normalize() and compact(). Loaded documents are kept
	 * in the cache for one day.
	 *
	 * The script is terminated when this loader shows up more than five
	 * times on the current call stack.
	 *
	 * @param $url
	 *
	 * @return mixed the loaded data
	 * @throws \JsonLdException
	 */
	public static function documentLoader($url)
	{
		// Count how often this loader is already present on the call stack.
		// Only the function names are needed, so arguments are left out of the trace.
		$recursion = 0;
		foreach (debug_backtrace(DEBUG_BACKTRACE_IGNORE_ARGS) as $frame) {
			if ($frame['function'] === __FUNCTION__) {
				$recursion++;
			}
		}

		if ($recursion > 5) {
			Logger::error('jsonld bomb detected at: ' . $url);
			exit();
		}

		$result = DI::cache()->get('documentLoader:' . $url);
		if (!is_null($result)) {
			return $result;
		}

		$data = jsonld_default_document_loader($url);
		DI::cache()->set('documentLoader:' . $url, $data, Duration::DAY);

		return $data;
	}

	/**
	 * Normalises a given JSON array
	 *
	 * @param array $json
	 *
	 * @return mixed|bool normalized JSON string, false when the normalization failed
	 * @throws Exception
	 */
	public static function normalize($json)
	{
		jsonld_set_document_loader('Friendica\Util\JsonLD::documentLoader');

		// The processor gets objects, so the array is sent through a JSON round trip
		$jsonobj = json_decode(json_encode($json, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE));

		try {
			$normalized = jsonld_normalize($jsonobj, ['algorithm' => 'URDNA2015', 'format' => 'application/nquads']);
		} catch (Exception $e) {
			$normalized = false;

			// Collect the messages of the whole exception chain
			$messages = [];
			$currentException = $e;
			do {
				$messages[] = $currentException->getMessage();
			} while ($currentException = $currentException->getPrevious());

			// The same event is logged with increasing detail at decreasing severity
			Logger::warning('JsonLD normalize error');
			Logger::notice('JsonLD normalize error', ['messages' => $messages]);
			Logger::info('JsonLD normalize error', ['trace' => $e->getTraceAsString()]);
			Logger::debug('JsonLD normalize error', ['jsonobj' => $jsonobj]);
		}

		return $normalized;
	}

	/**
	 * Compacts a given JSON array
	 *
	 * @param array $json
	 *
	 * @return array|bool Compacted JSON array, false when the compaction failed
	 * @throws Exception
	 */
	public static function compact($json)
	{
		jsonld_set_document_loader('Friendica\Util\JsonLD::documentLoader');

		$context = (object)['as' => 'https://www.w3.org/ns/activitystreams#',
			'w3id' => 'https://w3id.org/security#',
			'ldp' => (object)['@id' => 'http://www.w3.org/ns/ldp#', '@type' => '@id'],
			'vcard' => (object)['@id' => 'http://www.w3.org/2006/vcard/ns#', '@type' => '@id'],
			'dfrn' => (object)['@id' => 'http://purl.org/macgirvin/dfrn/1.0/', '@type' => '@id'],
			'diaspora' => (object)['@id' => 'https://diasporafoundation.org/ns/', '@type' => '@id'],
			'ostatus' => (object)['@id' => 'http://ostatus.org#', '@type' => '@id'],
			'dc' => (object)['@id' => 'http://purl.org/dc/terms/', '@type' => '@id'],
			'toot' => (object)['@id' => 'http://joinmastodon.org/ns#', '@type' => '@id'],
			'litepub' => (object)['@id' => 'http://litepub.social/ns#', '@type' => '@id']];

		if (!empty($json['@context']) && (is_string($json['@context']) || is_array($json['@context']))) {
			// Preparation for adding possibly missing content to the context.
			// A single context (URL or inline definition) is wrapped into a list,
			// otherwise the line below would add a term named "0" to an inline
			// definition instead of adding a further context.
			$json['@context'] = self::toList($json['@context']);

			// Workaround for servers with missing context
			// See issue https://github.com/nextcloud/social/issues/330
			$json['@context'][] = 'https://w3id.org/security/v1';
		}

		// Trying to avoid memory problems with large content fields
		if (!empty($json['object']['source']['content'])) {
			$content = $json['object']['source']['content'];
			$json['object']['source']['content'] = '';
		}

		$jsonobj = json_decode(json_encode($json, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE));

		try {
			$compacted = jsonld_compact($jsonobj, $context);
		} catch (Exception $e) {
			$compacted = false;
			Logger::error('compacting error');
			// Sooner or later we should log some details as well - but currently this leads to memory issues
		}

		// Back from objects to arrays. A failed compaction stays "false" here.
		$json = json_decode(json_encode($compacted, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE), true);

		// Put the content back that had been removed before the compaction
		if (isset($json['as:object']['as:source']['as:content']) && !empty($content)) {
			$json['as:object']['as:source']['as:content'] = $content;
		}

		return $json;
	}

	/**
	 * Fetches an element array from a JSON array
	 *
	 * Every entry of the element that is an array containing $key is replaced
	 * by the value of $key. Empty array entries are skipped, everything else
	 * is returned unchanged.
	 *
	 * @param $array
	 * @param $element
	 * @param $key
	 *
	 * @return array|null fetched elements, null when the element doesn't exist
	 */
	public static function fetchElementArray($array, $element, $key = '@id')
	{
		if (empty($array) || !isset($array[$element])) {
			return null;
		}

		$elements = [];

		foreach (self::toList($array[$element]) as $entry) {
			if (!is_array($entry)) {
				$elements[] = $entry;
			} elseif (isset($entry[$key])) {
				$elements[] = $entry[$key];
			} elseif (!empty($entry)) {
				$elements[] = $entry;
			}
		}

		return $elements;
	}

	/**
	 * Fetches an element from a JSON array
	 *
	 * Without $type and $type_value the first entry of the element is returned
	 * (reduced to the value of $key when available). With both of them set,
	 * the value of $key is returned from the first entry whose $type field
	 * equals $type_value.
	 *
	 * @param $array
	 * @param $element
	 * @param $key
	 * @param $type
	 * @param $type_value
	 *
	 * @return mixed|null fetched element, null when nothing was found
	 */
	public static function fetchElement($array, $element, $key = '@id', $type = null, $type_value = null)
	{
		if (empty($array) || !isset($array[$element])) {
			return null;
		}

		if (!is_array($array[$element])) {
			return $array[$element];
		}

		if (is_null($type) || is_null($type_value)) {
			$element_array = self::fetchElementArray($array, $element, $key);
			if (is_null($element_array)) {
				return null;
			}

			return array_shift($element_array);
		}

		// The raw entries are searched here. Going through fetchElementArray()
		// would reduce every entry with an "@id" to that id and by this remove
		// the fields that are needed for the type check.
		foreach (self::toList($array[$element]) as $entry) {
			if (is_array($entry) && isset($entry[$key]) && isset($entry[$type]) && ($entry[$type] == $type_value)) {
				return $entry[$key];
			}
		}

		return null;
	}

	/**
	 * Returns the given value as a list of entries
	 *
	 * Arrays with an integer as current (normally: first) key are seen as
	 * lists and returned unchanged. Every other value is wrapped into an array.
	 *
	 * @param mixed $value
	 *
	 * @return array
	 */
	private static function toList($value): array
	{
		// key() is only called on arrays, it fails on scalar values
		if (is_array($value) && is_int(key($value))) {
			return $value;
		}

		return [$value];
	}
}