<?php
/**
* @copyright Copyright (C) 2010-2021, the Friendica project
*
* @license GNU AGPL version 3 or any later version
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as
* published by the Free Software Foundation, either version 3 of the
* License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program. If not, see <https://www.gnu.org/licenses/>.
*
*/
namespace Friendica\Util;
use Friendica\Core\Cache\Duration;
use Friendica\Core\Logger;
use Exception;
use Friendica\DI;
/**
 * This class contains methods to work with JSON-LD data
 */
class JsonLD
{
    /**
     * Loader for LD-JSON validation
     *
     * Three well-known context URLs are rewritten to files below this node's
     * own "/static" path before loading. Loaded documents are stored in the
     * cache under "documentLoader:<url>" with a Duration::DAY lifetime.
     *
     * @param string $url URL of the document to load
     *
     * @return mixed the loaded data
     * @throws Exception when more than five calls of this loader are nested
     * @throws \JsonLdException
     */
    public static function documentLoader($url)
    {
        switch ($url) {
            case 'https://w3id.org/security/v1':
                $url = DI::baseUrl() . '/static/security-v1.jsonld';
                break;
            case 'https://w3id.org/identity/v1':
                $url = DI::baseUrl() . '/static/identity-v1.jsonld';
                break;
            case 'https://www.w3.org/ns/activitystreams':
                $url = DI::baseUrl() . '/static/activitystreams.jsonld';
                break;
            default:
                Logger::info('Got url', ['url' => $url]);
                break;
        }

        // Count how often this loader appears on the call stack (the current
        // call included). Only the function names are needed, so the
        // arguments are not collected.
        $recursion = 0;
        foreach (debug_backtrace(DEBUG_BACKTRACE_IGNORE_ARGS) as $frame) {
            if ($frame['function'] === __FUNCTION__) {
                $recursion++;
            }
        }

        if ($recursion > 5) {
            Logger::error('jsonld bomb detected at: ' . $url);
            // Abort this document only instead of terminating the whole process;
            // normalize() and compact() catch and log the exception.
            throw new Exception('jsonld bomb detected at: ' . $url);
        }

        $cacheKey = 'documentLoader:' . $url;

        $result = DI::cache()->get($cacheKey);
        if (!is_null($result)) {
            return $result;
        }

        $data = jsonld_default_document_loader($url);
        DI::cache()->set($cacheKey, $data, Duration::DAY);

        return $data;
    }

    /**
     * Normalises a given JSON array
     *
     * Uses the URDNA2015 algorithm with "application/nquads" as output format.
     * A failure is logged and reported through the return value.
     *
     * @param array $json
     *
     * @return mixed|bool normalized JSON string, false when the normalisation failed
     * @throws Exception
     */
    public static function normalize($json)
    {
        jsonld_set_document_loader(self::class . '::documentLoader');

        $jsonobj = json_decode(json_encode($json, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE));

        try {
            $normalized = jsonld_normalize($jsonobj, ['algorithm' => 'URDNA2015', 'format' => 'application/nquads']);
        } catch (Exception $e) {
            $normalized = false;

            // Collect the messages of the whole exception chain
            $messages = [];
            for ($current = $e; $current !== null; $current = $current->getPrevious()) {
                $messages[] = $current->getMessage();
            }

            // The same event is logged with growing detail on more verbose levels
            Logger::warning('JsonLD normalize error');
            Logger::notice('JsonLD normalize error', ['messages' => $messages]);
            Logger::info('JsonLD normalize error', ['trace' => $e->getTraceAsString()]);
            Logger::debug('JsonLD normalize error', ['jsonobj' => $jsonobj]);
        }

        return $normalized;
    }

    /**
     * Compacts a given JSON array
     *
     * @param array $json
     *
     * @return array Compacted JSON array, empty when the compaction failed
     * @throws Exception
     */
    public static function compact($json)
    {
        jsonld_set_document_loader(self::class . '::documentLoader');

        $context = (object)[
            'as'       => 'https://www.w3.org/ns/activitystreams#',
            'w3id'     => 'https://w3id.org/security#',
            'ldp'      => (object)['@id' => 'http://www.w3.org/ns/ldp#', '@type' => '@id'],
            'vcard'    => (object)['@id' => 'http://www.w3.org/2006/vcard/ns#', '@type' => '@id'],
            'dfrn'     => (object)['@id' => 'http://purl.org/macgirvin/dfrn/1.0/', '@type' => '@id'],
            'diaspora' => (object)['@id' => 'https://diasporafoundation.org/ns/', '@type' => '@id'],
            'ostatus'  => (object)['@id' => 'http://ostatus.org#', '@type' => '@id'],
            'dc'       => (object)['@id' => 'http://purl.org/dc/terms/', '@type' => '@id'],
            'toot'     => (object)['@id' => 'http://joinmastodon.org/ns#', '@type' => '@id'],
            'litepub'  => (object)['@id' => 'http://litepub.social/ns#', '@type' => '@id'],
            'sc'       => (object)['@id' => 'http://schema.org#', '@type' => '@id'],
            'pt'       => (object)['@id' => 'https://joinpeertube.org/ns#', '@type' => '@id'],
        ];

        // Preparation for adding possibly missing content to the context
        if (!empty($json['@context']) && is_string($json['@context'])) {
            $json['@context'] = [$json['@context']];
        }

        // Workaround for servers with missing context
        // See issue https://github.com/nextcloud/social/issues/330
        if (!empty($json['@context']) && is_array($json['@context'])) {
            $json['@context'][] = 'https://w3id.org/security/v1';
        }

        // Trying to avoid memory problems with large content fields:
        // the content is taken out before compacting and put back afterwards
        $content = null;
        if (!empty($json['object']['source']['content'])) {
            $content = $json['object']['source']['content'];
            $json['object']['source']['content'] = '';
        }

        $jsonobj = json_decode(json_encode($json, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE));

        try {
            $compacted = jsonld_compact($jsonobj, $context);
        } catch (Exception $e) {
            Logger::notice('compacting error', ['line' => $e->getLine(), 'exception' => $e]);
            // Keep the documented return type instead of handing out "false"
            return [];
        }

        $json = json_decode(json_encode($compacted, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE), true);
        if (!is_array($json)) {
            return [];
        }

        if (isset($json['as:object']['as:source']['as:content']) && !empty($content)) {
            $json['as:object']['as:source']['as:content'] = $content;
        }

        return $json;
    }

    /**
     * Fetches an element array from a JSON array
     *
     * A value that is not an array, or an array whose first key is not an
     * integer, is treated as a list with a single entry.
     *
     * @param array       $array
     * @param string      $element    Name of the element to read from $array
     * @param string|null $key        When set, this key is read from every array entry;
     *                                array entries without it are skipped
     * @param string|null $type       When set together with $type_value: key that
     *                                a fetched item has to contain
     * @param mixed       $type_value Value (loosely compared) that the item needs at $type
     *
     * @return array|null fetched elements, null when $element isn't set
     */
    public static function fetchElementArray($array, $element, $key = null, $type = null, $type_value = null)
    {
        if (!isset($array[$element])) {
            return null;
        }

        $entries = $array[$element];

        // If it isn't a list yet, make it to one
        if (!is_array($entries) || !is_int(key($entries))) {
            $entries = [$entries];
        }

        $filterByType = !is_null($type) && !is_null($type_value);

        $elements = [];
        foreach ($entries as $entry) {
            // Determined anew for every entry, so that an entry without the
            // requested key can't pick up the value of its predecessor
            $item = null;
            if (!is_array($entry) || is_null($key)) {
                $item = $entry;
            } elseif (isset($entry[$key])) {
                $item = $entry[$key];
            }

            if (is_null($item)) {
                continue;
            }

            if (!$filterByType || (isset($item[$type]) && $item[$type] == $type_value)) {
                $elements[] = $item;
            }
        }

        return $elements;
    }

    /**
     * Fetches an element from a JSON array
     *
     * A value that isn't an array is returned as it is. Without a type filter
     * the first entry offering $key is used, otherwise the first entry that
     * offers $key and whose $type equals (loosely compared) $type_value.
     *
     * @param array       $array
     * @param string      $element    Name of the element to read from $array
     * @param string      $key        Key of the value that is returned
     * @param string|null $type       Key that holds the type of an entry
     * @param mixed       $type_value Type value an entry needs to have
     *
     * @return mixed|null fetched element, null when nothing was found
     */
    public static function fetchElement($array, $element, $key = '@id', $type = null, $type_value = null)
    {
        if (empty($array) || !isset($array[$element])) {
            return null;
        }

        if (!is_array($array[$element])) {
            return $array[$element];
        }

        if (is_null($type) || is_null($type_value)) {
            $element_array = self::fetchElementArray($array, $element, $key);
            if (is_null($element_array)) {
                return null;
            }

            // array_shift() returns null on an empty list
            return array_shift($element_array);
        }

        $element_array = self::fetchElementArray($array, $element);
        if (is_null($element_array)) {
            return null;
        }

        foreach ($element_array as $entry) {
            if (isset($entry[$key]) && isset($entry[$type]) && ($entry[$type] == $type_value)) {
                return $entry[$key];
            }
        }

        return null;
    }
}