<?php
/**
* @copyright Copyright (C) 2010-2022, the Friendica project
*
* @license GNU AGPL version 3 or any later version
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as
* published by the Free Software Foundation, either version 3 of the
* License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program. If not, see <https://www.gnu.org/licenses/>.
*
*/
namespace Friendica\Util;
use Exception;
use Friendica\Core\Cache\Enum\Duration;
use Friendica\Core\Logger;
use Friendica\Core\System;
use Friendica\DI;

/**
 * This class contains methods to work with JsonLD data
 */
class JsonLD
{
	/**
	 * Loader for LD-JSON validation
	 *
	 * A set of known context URLs is rewritten to the copies served below
	 * "/static" on this node. Loaded documents are stored in the cache with
	 * a lifetime of Duration::DAY.
	 *
	 * @param string $url URL of the document to load
	 *
	 * @return mixed the loaded data
	 * @throws \JsonLdException
	 */
	public static function documentLoader($url)
	{
		switch ($url) {
			case 'https://w3id.org/security/v1':
				$url = DI::baseUrl() . '/static/security-v1.jsonld';
				break;
			case 'https://w3id.org/identity/v1':
				$url = DI::baseUrl() . '/static/identity-v1.jsonld';
				break;
			case 'https://www.w3.org/ns/activitystreams':
				$url = DI::baseUrl() . '/static/activitystreams.jsonld';
				break;
			case 'https://funkwhale.audio/ns':
				$url = DI::baseUrl() . '/static/funkwhale.audio.jsonld';
				break;
			default:
				// Some schemas are hosted on many different servers, so only the path is compared
				switch (parse_url($url, PHP_URL_PATH)) {
					case '/schemas/litepub-0.1.jsonld':
						$url = DI::baseUrl() . '/static/litepub-0.1.jsonld';
						break;
					case '/apschema/v1.2':
					case '/apschema/v1.9':
					case '/apschema/v1.10':
						$url = DI::baseUrl() . '/static/apschema.jsonld';
						break;
					default:
						Logger::info('Got url', ['url' =>$url]);
						break;
				}
		}

		// Count how often this loader already appears on the call stack.
		// Only the function names are needed, so the arguments are not collected.
		$recursion = 0;
		foreach (debug_backtrace(DEBUG_BACKTRACE_IGNORE_ARGS) as $frame) {
			if ($frame['function'] === __FUNCTION__) {
				$recursion++;
			}
		}

		if ($recursion > 5) {
			Logger::error('jsonld bomb detected at: ' . $url);
			System::exit();
		}

		$cache_key = 'documentLoader:' . $url;

		$result = DI::cache()->get($cache_key);
		if (!is_null($result)) {
			return $result;
		}

		$data = jsonld_default_document_loader($url);
		DI::cache()->set($cache_key, $data, Duration::DAY);

		return $data;
	}

	/**
	 * Normalises a given JSON array
	 *
	 * @param array $json
	 *
	 * @return mixed|bool normalized JSON string, false when the normalization failed
	 * @throws Exception
	 */
	public static function normalize($json)
	{
		jsonld_set_document_loader('Friendica\Util\JsonLD::documentLoader');

		// Encode and decode again so that the data is handed over in its object form
		$jsonobj = json_decode(json_encode($json, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE));

		try {
			$normalized = jsonld_normalize($jsonobj, ['algorithm' => 'URDNA2015', 'format' => 'application/nquads']);
		} catch (Exception $e) {
			$normalized = false;

			// Collect the messages of the whole exception chain
			$messages = [];
			$currentException = $e;
			do {
				$messages[] = $currentException->getMessage();
			} while ($currentException = $currentException->getPrevious());

			// The same error is reported with growing detail on the more verbose log levels
			Logger::warning('JsonLD normalize error');
			Logger::notice('JsonLD normalize error', ['messages' => $messages]);
			Logger::info('JsonLD normalize error', ['trace' => $e->getTraceAsString()]);
			Logger::debug('JsonLD normalize error', ['jsonobj' => $jsonobj]);
		}

		return $normalized;
	}

	/**
	 * Compacts a given JSON array
	 *
	 * @param array $json
	 * @param bool  $logfailed When true and the config value "debug.ap_log_failure" is set,
	 *                         the original data of a failed compacting is written to a temporary file
	 *
	 * @return array|bool Compacted JSON array, false when the compacting failed
	 * @throws Exception
	 */
	public static function compact($json, bool $logfailed = true)
	{
		jsonld_set_document_loader('Friendica\Util\JsonLD::documentLoader');

		$context = (object)[
			'as'        => 'https://www.w3.org/ns/activitystreams#',
			'w3id'      => 'https://w3id.org/security#',
			'ldp'       => (object)['@id' => 'http://www.w3.org/ns/ldp#', '@type' => '@id'],
			'vcard'     => (object)['@id' => 'http://www.w3.org/2006/vcard/ns#', '@type' => '@id'],
			'dfrn'      => (object)['@id' => 'http://purl.org/macgirvin/dfrn/1.0/', '@type' => '@id'],
			'diaspora'  => (object)['@id' => 'https://diasporafoundation.org/ns/', '@type' => '@id'],
			'ostatus'   => (object)['@id' => 'http://ostatus.org#', '@type' => '@id'],
			'dc'        => (object)['@id' => 'http://purl.org/dc/terms/', '@type' => '@id'],
			'toot'      => (object)['@id' => 'http://joinmastodon.org/ns#', '@type' => '@id'],
			'litepub'   => (object)['@id' => 'http://litepub.social/ns#', '@type' => '@id'],
			'sc'        => (object)['@id' => 'http://schema.org#', '@type' => '@id'],
			'pt'        => (object)['@id' => 'https://joinpeertube.org/ns#', '@type' => '@id'],
			'mobilizon' => (object)['@id' => 'https://joinmobilizon.org/ns#', '@type' => '@id'],
		];

		// The untouched input is kept for the failure log
		$orig_json = $json;

		// Preparation for adding possibly missing content to the context
		if (!empty($json['@context']) && is_string($json['@context'])) {
			$json['@context'] = [$json['@context']];
		}

		if (!empty($json['@context']) && is_array($json['@context'])) {
			// Remove empty entries from the context (a problem with WriteFreely)
			$context_entries = array_filter($json['@context']);

			// array_filter() preserves the keys. A list with gaps in its keys would be encoded
			// as a JSON object below, so arrays without string keys are reindexed.
			if (!array_filter(array_keys($context_entries), 'is_string')) {
				$context_entries = array_values($context_entries);
			}

			// Workaround for servers with missing context
			// See issue https://github.com/nextcloud/social/issues/330
			if (!in_array('https://w3id.org/security/v1', $context_entries, true)) {
				$context_entries[] = 'https://w3id.org/security/v1';
			}

			$json['@context'] = $context_entries;
		}

		// Bookwyrm transmits "id" fields with "null", which isn't allowed.
		// The key is compared strictly, so that numeric list indexes never match.
		array_walk_recursive($json, static function (&$value, $key) {
			if ($key === 'id' && is_null($value)) {
				$value = '';
			}
		});

		$jsonobj = json_decode(json_encode($json, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE));

		try {
			$compacted = jsonld_compact($jsonobj, $context);
		} catch (Exception $e) {
			$compacted = false;
			Logger::notice('compacting error', ['msg' => $e->getMessage(), 'previous' => $e->getPrevious(), 'line' => $e->getLine()]);

			if ($logfailed && DI::config()->get('debug', 'ap_log_failure')) {
				$tempfile = tempnam(System::getTempPath(), 'failed-jsonld');

				// tempnam() returns false when no file could be created
				if ($tempfile !== false) {
					$failure = [
						'json'      => $orig_json,
						'callstack' => System::callstack(20),
						'msg'       => $e->getMessage(),
						'previous'  => $e->getPrevious(),
					];
					file_put_contents($tempfile, json_encode($failure, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE | JSON_PRETTY_PRINT));
					Logger::notice('Failed message stored', ['file' => $tempfile]);
				}
			}
		}

		// Convert the result (objects) back into nested arrays; a failed compacting yields false
		$json = json_decode(json_encode($compacted, JSON_UNESCAPED_SLASHES | JSON_UNESCAPED_UNICODE), true);

		return $json;
	}

	/**
	 * Fetches an element array from a JSON array
	 *
	 * @param array       $array      Array that contains the element
	 * @param string      $element    Name of the element to fetch
	 * @param string|null $key        When set, this key is read from every entry that is an array;
	 *                                entries without that key are skipped
	 * @param string|null $type       When set together with $type_value, only items are returned
	 *                                whose field $type equals $type_value
	 * @param mixed       $type_value Value that the field $type has to match
	 *
	 * @return array|null fetched elements, null when the element doesn't exist
	 */
	public static function fetchElementArray($array, $element, $key = null, $type = null, $type_value = null)
	{
		if (!isset($array[$element])) {
			return null;
		}

		// If it isn't an array yet, make it to one
		if (!is_array($array[$element]) || !is_int(key($array[$element]))) {
			$array[$element] = [$array[$element]];
		}

		$elements = [];

		foreach ($array[$element] as $entry) {
			if (!is_array($entry) || is_null($key)) {
				$item = $entry;
			} elseif (isset($entry[$key])) {
				$item = $entry[$key];
			} else {
				// The entry has no value for the key. It must be skipped here, otherwise
				// the item of the previous entry would be added a second time.
				continue;
			}

			if (isset($item) && (is_null($type) || is_null($type_value) || isset($item[$type]) && $item[$type] == $type_value)) {
				$elements[] = $item;
			}
		}

		return $elements;
	}

	/**
	 * Fetches an element from a JSON array
	 *
	 * @param array       $array      Array that contains the element
	 * @param string      $element    Name of the element to fetch
	 * @param string      $key        Key that is read from the entries of the element
	 * @param string|null $type       When set together with $type_value, the first entry is used
	 *                                whose field $type equals $type_value
	 * @param mixed       $type_value Value that the field $type has to match
	 *
	 * @return mixed|null fetched element, null when nothing was found
	 */
	public static function fetchElement($array, $element, $key = '@id', $type = null, $type_value = null)
	{
		if (empty($array)) {
			return null;
		}

		if (!isset($array[$element])) {
			return null;
		}

		// Scalar values are returned as they are
		if (!is_array($array[$element])) {
			return $array[$element];
		}

		if (is_null($type) || is_null($type_value)) {
			// Without a type filter the first entry that provides the key is returned
			$element_array = self::fetchElementArray($array, $element, $key);
			if (is_null($element_array)) {
				return null;
			}

			return array_shift($element_array);
		}

		$element_array = self::fetchElementArray($array, $element);
		if (is_null($element_array)) {
			return null;
		}

		foreach ($element_array as $entry) {
			if (isset($entry[$key]) && isset($entry[$type]) && ($entry[$type] == $type_value)) {
				return $entry[$key];
			}
		}

		return null;
	}
}