friendica/src/Util/JsonLD.php

313 lines
8.4 KiB
PHP
Raw Normal View History

<?php
/**
* @copyright Copyright (C) 2010-2021, the Friendica project
*
* @license GNU AGPL version 3 or any later version
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as
* published by the Free Software Foundation, either version 3 of the
* License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program. If not, see <https://www.gnu.org/licenses/>.
*
*/
namespace Friendica\Util;
use Friendica\Core\Cache\Duration;
2018-10-29 17:20:46 -04:00
use Friendica\Core\Logger;
2018-09-26 18:45:13 -04:00
use Exception;
use Friendica\Core\System;
use Friendica\DI;
use Friendica\Protocol\ActivityPub;
/**
 * This class contains methods to work with JsonLD data
 */
class JsonLD
{
	/**
	 * Loader for LD-JSON validation
	 *
	 * Loaded documents are cached for one day under the key "documentLoader:<url>".
	 * The call stack is inspected on every call: when more than five active frames
	 * carry this method's name, the URL is logged and the process is terminated.
	 *
	 * @param string $url URL of the document to load
	 *
	 * @return mixed the loaded data
	 * @throws \JsonLdException
	 */
	public static function documentLoader($url)
	{
		$recursion = 0;

		// Only the function names are compared, so the call arguments are not collected
		foreach (debug_backtrace(DEBUG_BACKTRACE_IGNORE_ARGS) as $frame) {
			if ($frame['function'] === __FUNCTION__) {
				$recursion++;
			}
		}

		if ($recursion > 5) {
			Logger::error('jsonld bomb detected at: ' . $url);
			exit();
		}

		$result = DI::cache()->get('documentLoader:' . $url);
		if (!is_null($result)) {
			return $result;
		}

		$data = jsonld_default_document_loader($url);
		DI::cache()->set('documentLoader:' . $url, $data, Duration::DAY);

		return $data;
	}

	/**
	 * Removes the "https://w3id.org/security/v1" entry from a list-style "@context"
	 *
	 * The array is returned unchanged when "@context" is missing, empty, not an
	 * array, or a term map (an array with non-sequential keys).
	 *
	 * @param array $json
	 *
	 * @return array the JSON array, possibly with a reduced "@context" list
	 */
	public static function removeSecurityLink(array $json)
	{
		if (empty($json['@context']) || !is_array($json['@context']) || !self::isList($json['@context'])) {
			return $json;
		}

		$json['@context'] = self::stripSecurityLink($json['@context']);

		return $json;
	}

	/**
	 * Prepares the "@context" of a JSON array for compacting
	 *
	 * The context is turned into a list (a single string or term map becomes a
	 * one-element list, a missing or empty context becomes an empty list), the
	 * "https://w3id.org/security/v1" entry is removed and the signature related
	 * terms are added: merged into the last entry when that entry is a term map,
	 * appended as a new entry otherwise.
	 *
	 * @param array $json
	 *
	 * @return array the JSON array with the adjusted "@context"
	 */
	public static function fixContext(array $json)
	{
		$context = $json['@context'] ?? [];

		if (empty($context)) {
			$context = [];
		} elseif (!is_array($context) || !self::isList($context)) {
			// A single context (string or term map) is handled as a one-element list
			$context = [$context];
		}

		$context = self::stripSecurityLink($context);

		$additional = [
			'w3id'             => 'https://w3id.org/security#',
			'signature'        => 'w3id:signature',
			'RsaSignature2017' => 'w3id:RsaSignature2017',
			'created'          => 'w3id:created',
			'creator'          => 'w3id:creator',
			'nonce'            => 'w3id:nonce',
			'signatureValue'   => 'w3id:signatureValue',
			'publicKey'        => 'w3id:publicKey',
			'publicKeyPem'     => 'w3id:publicKeyPem',
		];

		$last_entry = count($context) - 1;

		if ($last_entry >= 0 && is_array($context[$last_entry])) {
			$context[$last_entry] = array_merge($context[$last_entry], $additional);
		} else {
			$context[] = $additional;
		}

		$json['@context'] = $context;

		return $json;
	}

	/**
	 * Normalises a given JSON array
	 *
	 * The security context link is removed before the data is handed to
	 * jsonld_normalize() with the URDNA2015 algorithm and N-Quads output.
	 * Exceptions raised there are caught and logged.
	 *
	 * @param array $json
	 *
	 * @return mixed|bool normalized JSON string, false when normalizing failed
	 * @throws Exception
	 */
	public static function normalize($json)
	{
		$json = self::removeSecurityLink($json);

		jsonld_set_document_loader('Friendica\Util\JsonLD::documentLoader');

		// The JSON-LD functions are fed with objects, so the array is converted via a JSON round trip
		$jsonobj = json_decode(json_encode($json, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE));

		try {
			$normalized = jsonld_normalize($jsonobj, ['algorithm' => 'URDNA2015', 'format' => 'application/nquads']);
		} catch (Exception $e) {
			$normalized = false;

			// Collect the messages of the whole exception chain
			$messages = [];
			$currentException = $e;
			do {
				$messages[] = $currentException->getMessage();
			} while ($currentException = $currentException->getPrevious());

			// The amount of detail grows with the verbosity of the log level
			Logger::warning('JsonLD normalize error');
			Logger::notice('JsonLD normalize error', ['messages' => $messages]);
			Logger::info('JsonLD normalize error', ['trace' => $e->getTraceAsString()]);
			Logger::debug('JsonLD normalize error', ['jsonobj' => $jsonobj]);
		}

		return $normalized;
	}

	/**
	 * Compacts a given JSON array
	 *
	 * The first attempt replaces the "@context" with ActivityPub::CONTEXT. When
	 * that yields an empty result, a second attempt uses the original context.
	 *
	 * @param array $json
	 *
	 * @return array Compacted JSON array, an empty value when both attempts failed
	 * @throws Exception
	 */
	public static function compact($json)
	{
		$context = $json['@context'] ?? [];

		$json['@context'] = ActivityPub::CONTEXT;

		$compacted = self::internalCompact($json);
		if (empty($compacted)) {
			Logger::info('Failed to compact with our context');

			$json['@context'] = $context;

			$compacted = self::internalCompact($json);
			if (empty($compacted)) {
				Logger::info('Failed to compact with original context');
			} else {
				Logger::info('Successful compacted with original context');
			}
		}

		return $compacted;
	}

	/**
	 * Compacts a JSON array against the fixed set of prefixes defined below
	 *
	 * @param array $json
	 *
	 * @return array|bool Compacted JSON array, false when jsonld_compact() raised an exception
	 */
	private static function internalCompact($json)
	{
		$json = self::fixContext($json);

		jsonld_set_document_loader('Friendica\Util\JsonLD::documentLoader');

		$context = (object)[
			'as'       => 'https://www.w3.org/ns/activitystreams#',
			'w3id'     => (object)['@id' => 'https://w3id.org/security#', '@type' => '@id'],
			'ldp'      => (object)['@id' => 'http://www.w3.org/ns/ldp#', '@type' => '@id'],
			'vcard'    => (object)['@id' => 'http://www.w3.org/2006/vcard/ns#', '@type' => '@id'],
			'dfrn'     => (object)['@id' => 'http://purl.org/macgirvin/dfrn/1.0/', '@type' => '@id'],
			'diaspora' => (object)['@id' => 'https://diasporafoundation.org/ns/', '@type' => '@id'],
			'ostatus'  => (object)['@id' => 'http://ostatus.org#', '@type' => '@id'],
			'dc'       => (object)['@id' => 'http://purl.org/dc/terms/', '@type' => '@id'],
			'toot'     => (object)['@id' => 'http://joinmastodon.org/ns#', '@type' => '@id'],
			'litepub'  => (object)['@id' => 'http://litepub.social/ns#', '@type' => '@id'],
			'sc'       => (object)['@id' => 'http://schema.org#', '@type' => '@id'],
			'pt'       => (object)['@id' => 'https://joinpeertube.org/ns#', '@type' => '@id'],
		];

		// Trying to avoid memory problems with large content fields:
		// the source content is taken out here and put back after compacting
		$content = null;
		if (!empty($json['object']['source']['content'])) {
			$content = $json['object']['source']['content'];
			$json['object']['source']['content'] = '';
		}

		$jsonobj = json_decode(json_encode($json, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE));

		try {
			$compacted = jsonld_compact($jsonobj, $context);
		} catch (Exception $e) {
			$compacted = false;
			Logger::error('compacting error', ['line' => $e->getLine(), 'message' => $e->getMessage(),'callstack' => System::callstack(20)]);
		}

		// Convert the result back into an associative array
		$json = json_decode(json_encode($compacted, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE), true);

		if (isset($json['as:object']['as:source']['as:content']) && !empty($content)) {
			$json['as:object']['as:source']['as:content'] = $content;
		}

		return $json;
	}

	/**
	 * Fetches an element array from a JSON array
	 *
	 * A scalar element or a single associative entry is treated as a list with
	 * one entry. For every entry either the entry itself (no $key given or the
	 * entry is no array) or its $key field is collected. Entries without the
	 * $key field are skipped. When both $type and $type_value are given, only
	 * items whose $type field equals $type_value are returned.
	 *
	 * @param array       $array
	 * @param string      $element    name of the element to fetch
	 * @param string|null $key        field to extract from every entry
	 * @param string|null $type       field that has to match $type_value
	 * @param mixed       $type_value
	 *
	 * @return array|null fetched elements, null when the element isn't set
	 */
	public static function fetchElementArray($array, $element, $key = null, $type = null, $type_value = null)
	{
		if (!isset($array[$element])) {
			return null;
		}

		$entries = $array[$element];

		// If it isn't a list yet, make it to one
		if (!is_array($entries) || !is_int(key($entries))) {
			$entries = [$entries];
		}

		$unfiltered = is_null($type) || is_null($type_value);

		$elements = [];

		foreach ($entries as $entry) {
			if (!is_array($entry) || is_null($key)) {
				$item = $entry;
			} elseif (isset($entry[$key])) {
				$item = $entry[$key];
			} else {
				// Nothing to fetch from this entry, the previous item must not be reused
				continue;
			}

			if (!isset($item)) {
				continue;
			}

			if ($unfiltered || (isset($item[$type]) && $item[$type] == $type_value)) {
				$elements[] = $item;
			}
		}

		return $elements;
	}

	/**
	 * Fetches an element from a JSON array
	 *
	 * A non-array element is returned as it is. Without a type filter the $key
	 * field of the first matching entry is returned. With $type and $type_value
	 * given, the $key field of the first entry whose $type field equals
	 * $type_value is returned.
	 *
	 * @param array       $array
	 * @param string      $element    name of the element to fetch
	 * @param string      $key        field to extract from the entry
	 * @param string|null $type       field that has to match $type_value
	 * @param mixed       $type_value
	 *
	 * @return mixed|null fetched element, null when nothing was found
	 */
	public static function fetchElement($array, $element, $key = '@id', $type = null, $type_value = null)
	{
		if (empty($array) || !isset($array[$element])) {
			return null;
		}

		if (!is_array($array[$element])) {
			return $array[$element];
		}

		if (is_null($type) || is_null($type_value)) {
			$element_array = self::fetchElementArray($array, $element, $key);
			if (is_null($element_array)) {
				return null;
			}

			return array_shift($element_array);
		}

		$element_array = self::fetchElementArray($array, $element);
		if (is_null($element_array)) {
			return null;
		}

		foreach ($element_array as $entry) {
			if (isset($entry[$key]) && isset($entry[$type]) && ($entry[$type] == $type_value)) {
				return $entry[$key];
			}
		}

		return null;
	}

	/**
	 * Checks whether an array has the keys 0, 1, 2, ... in exactly that order
	 *
	 * @param array $value
	 *
	 * @return bool true for sequential lists (including the empty array)
	 */
	private static function isList(array $value)
	{
		$expected = 0;

		foreach ($value as $index => $unused) {
			if ($index !== $expected++) {
				return false;
			}
		}

		return true;
	}

	/**
	 * Drops the first "https://w3id.org/security/v1" entry from a context list
	 *
	 * When the entry is found, empty entries are removed as well and the list is
	 * reindexed. Otherwise the list is returned untouched.
	 *
	 * @param array $context list-style context
	 *
	 * @return array
	 */
	private static function stripSecurityLink(array $context)
	{
		// Strict comparison: context entries may be arrays or other non-string values
		$position = array_search('https://w3id.org/security/v1', $context, true);
		if ($position === false) {
			return $context;
		}

		unset($context[$position]);

		return array_values(array_filter($context));
	}
}