André Menrath
21d1ee9915
Some checks failed
PHP Code Checker / PHP Code Checker (pull_request) Failing after 45s
PHPUnit / PHPUnit – PHP 7.4 (pull_request) Failing after 57s
PHPUnit / PHPUnit – PHP 8.0 (pull_request) Failing after 57s
PHPUnit / PHPUnit – PHP 8.1 (pull_request) Failing after 56s
PHPUnit / PHPUnit – PHP 8.2 (pull_request) Failing after 51s
PHPUnit / PHPUnit – PHP 8.3 (pull_request) Failing after 55s
PHPUnit / PHPUnit – PHP 8.4 (pull_request) Failing after 52s
272 lines
7.7 KiB
PHP
272 lines
7.7 KiB
PHP
<?php
|
|
/**
|
|
* Class file for parsing an ActivityPub outbox for Events.
|
|
*
|
|
* The main external entry function is `backfill_events`.
|
|
* The function `import_events_from_outbox` is used for delaying the parsing via schedules.
|
|
*
|
|
* @package Event_Bridge_For_ActivityPub
|
|
* @since 1.0.0
|
|
* @license AGPL-3.0-or-later
|
|
*/
|
|
|
|
namespace Event_Bridge_For_ActivityPub;
|
|
|
|
use Activitypub\Http;
|
|
use Event_Bridge_For_ActivityPub\ActivityPub\Model\Event_Source;
|
|
|
|
/**
|
|
* Class for parsing an ActivityPub outbox for Events.
|
|
*
|
|
* The main external entry function is `backfill_events`.
|
|
* The function `import_events_from_outbox` is used for delaying the parsing via schedules.
|
|
*/
|
|
class Outbox_Parser {
|
|
/**
|
|
* Maximum number of events to backfill per actor.
|
|
*/
|
|
const MAX_EVENTS_TO_IMPORT = 20;
|
|
|
|
/**
|
|
* Init actions.
|
|
*/
|
|
public static function init() {
|
|
// Add action for backfilling the events.
|
|
\add_action( 'event_bridge_for_activitypub_backfill_events', array( self::class, 'backfill_events' ), 10, 1 );
|
|
\add_action( 'event_bridge_for_activitypub_import_events_from_outbox', array( self::class, 'import_events_from_outbox' ), 10, 2 );
|
|
}
|
|
|
|
/**
|
|
* Initialize the backfilling of events via the outbox of an ActivityPub actor.
|
|
*
|
|
* @param string $actor The ActivityPub ID of the actor which owns the outbox.
|
|
* @return bool|WP_Error
|
|
*/
|
|
public static function backfill_events( $actor ) {
|
|
// Initiate parsing of outbox collection.
|
|
$event_source = Event_Source::get_by_id( $actor );
|
|
|
|
if ( ! $event_source ) {
|
|
return;
|
|
}
|
|
|
|
$outbox_url = $event_source->get_outbox();
|
|
|
|
if ( ! $outbox_url ) {
|
|
return;
|
|
}
|
|
|
|
// Schedule the import of events via the outbox.
|
|
return self::queue_importing_from_outbox( $outbox_url, $actor, 0 );
|
|
}
|
|
|
|
/**
|
|
* Import events from an outbox: OrderedCollection or OrderedCollectionPage.
|
|
*
|
|
* @param string $url The url of the current page or outbox.
|
|
* @param string $actor The ActivityPub ID/URL of the actor that owns the outbox.
|
|
* @return void
|
|
*/
|
|
public static function import_events_from_outbox( $url, $actor ) {
|
|
$outbox = self::fetch_outbox( $url );
|
|
|
|
if ( ! $outbox ) {
|
|
return;
|
|
}
|
|
|
|
$current_count = self::get_import_count( $actor );
|
|
|
|
if ( $current_count >= self::MAX_EVENTS_TO_IMPORT ) {
|
|
return;
|
|
}
|
|
|
|
// Process orderedItems if they exist (non-paginated outbox).
|
|
if ( isset( $outbox['orderedItems'] ) && is_array( $outbox['orderedItems'] ) ) {
|
|
$current_count += self::import_events_from_items(
|
|
$outbox['orderedItems'],
|
|
$actor,
|
|
self::MAX_EVENTS_TO_IMPORT - $current_count
|
|
);
|
|
}
|
|
|
|
self::update_import_count( $actor, $current_count );
|
|
|
|
// If the count is already exceeded abort here.
|
|
if ( $current_count >= self::MAX_EVENTS_TO_IMPORT ) {
|
|
return;
|
|
}
|
|
|
|
// Get next page and if it exists schedule the import of next page.
|
|
$pagination_url = self::get_pagination_url( $outbox );
|
|
|
|
if ( $pagination_url ) {
|
|
self::queue_importing_from_outbox( $pagination_url, $actor );
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Check if an Activity is of type Update or Create.
|
|
*
|
|
* @param array $activity The Activity as associative array.
|
|
* @return bool
|
|
*/
|
|
private static function is_create_or_update_activity( $activity ) {
|
|
if ( ! isset( $activity['type'] ) ) {
|
|
return false;
|
|
}
|
|
if ( in_array( $activity['type'], array( 'Update', 'Create' ), true ) ) {
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
/**
|
|
* Parses items from an Collection, OrderedCollection, CollectionPage or OrderedCollectionPage.
|
|
*
|
|
* @param array $items The items as an associative array.
|
|
* @param int $max_items The maximum number of items to parse.
|
|
* @return array Parsed events from the collection.
|
|
*/
|
|
private static function parse_items_for_events( $items, $max_items ) {
|
|
$parsed_events = array();
|
|
|
|
foreach ( $items as $activity ) {
|
|
// Abort if we have exceeded the maximal events to return.
|
|
if ( $max_items > 0 && count( $parsed_events ) >= $max_items ) {
|
|
break;
|
|
}
|
|
|
|
// Check if it is a create or update Activity.
|
|
if ( ! self::is_create_or_update_activity( $activity ) ) {
|
|
continue;
|
|
}
|
|
|
|
// If no object is set we cannot process anything.
|
|
if ( ! isset( $activity['object'] ) ) {
|
|
continue;
|
|
}
|
|
|
|
// Check if the Event object meets the minimum requirements and is valid.
|
|
$is_valid = Event_Sources::is_valid_activitypub_event_object( $activity['object'] );
|
|
if ( ! $is_valid || \is_wp_error( $is_valid ) ) {
|
|
continue;
|
|
}
|
|
|
|
// Check if the event is in the future or ongoing.
|
|
if ( Event_Sources::is_ongoing_or_future_event( $activity['object'] ) ) {
|
|
$parsed_events[] = $activity['object'];
|
|
}
|
|
}
|
|
|
|
return $parsed_events;
|
|
}
|
|
|
|
/**
|
|
* Import events from the items of an outbox.
|
|
*
|
|
* @param array $items The items/orderedItems as an associative array.
|
|
* @param string $actor The actor that owns the items.
|
|
* @param int $limit The limit of how many events to save locally.
|
|
* @return int The number of saved events (at least attempted).
|
|
*/
|
|
private static function import_events_from_items( $items, $actor, $limit = -1 ) {
|
|
$events = self::parse_items_for_events( $items, $limit );
|
|
|
|
$transmogrifier = Setup::get_transmogrifier();
|
|
|
|
if ( ! $transmogrifier ) {
|
|
return;
|
|
}
|
|
|
|
$imported_count = 0;
|
|
|
|
foreach ( $events as $event ) {
|
|
$transmogrifier->save( $event, $actor );
|
|
++$imported_count;
|
|
if ( $limit > 0 && $imported_count >= $limit ) {
|
|
break;
|
|
}
|
|
}
|
|
|
|
return $imported_count;
|
|
}
|
|
|
|
/**
|
|
* Schedule the import of events from an outbox OrderedCollection or OrderedCollectionPage.
|
|
*
|
|
* @param string $url The url of the current page or outbox.
|
|
* @param string $actor The ActivityPub ID/URL of the actor that owns the outbox.
|
|
* @param int $delay The delay of the current time in seconds.
|
|
* @return void
|
|
*/
|
|
private static function queue_importing_from_outbox( $url, $actor, $delay = 10 ) {
|
|
$hook = 'event_bridge_for_activitypub_import_events_from_outbox';
|
|
$args = array( $url, $actor );
|
|
|
|
if ( \wp_next_scheduled( $hook, $args ) ) {
|
|
return;
|
|
}
|
|
|
|
return \wp_schedule_single_event( \time() + $delay, $hook, $args );
|
|
}
|
|
|
|
/**
|
|
* Get the current import count for the actor.
|
|
*
|
|
* @param string $actor The actor's ID/URL.
|
|
* @return int The current count of imported events.
|
|
*/
|
|
private static function get_import_count( $actor ) {
|
|
$post_id = Event_Source::get_by_id( $actor )->ID;
|
|
return (int) \get_post_meta( $post_id, '_event_bridge_for_activitypub_event_count', true );
|
|
}
|
|
|
|
/**
|
|
* Update the import count for the actor.
|
|
*
|
|
* @param string $actor The actor's ID/URL.
|
|
* @param int $count The new count of imported events.
|
|
* @return void
|
|
*/
|
|
private static function update_import_count( $actor, $count ) {
|
|
$post_id = Event_Source::get_by_id( $actor )->ID;
|
|
\update_post_meta( $post_id, '_event_bridge_for_activitypub_event_count', $count );
|
|
}
|
|
|
|
/**
|
|
* Fetch the outbox from the given URL.
|
|
*
|
|
* @param string $url The URL of the outbox.
|
|
* @return array|null The decoded outbox data, or null if fetching fails.
|
|
*/
|
|
private static function fetch_outbox( $url ) {
|
|
$response = Http::get( $url );
|
|
|
|
if ( \is_wp_error( $response ) ) {
|
|
return null;
|
|
}
|
|
|
|
$outbox = \wp_remote_retrieve_body( $response );
|
|
$outbox = \json_decode( $outbox, true );
|
|
|
|
return ( is_array( $outbox ) && isset( $outbox['type'] ) && isset( $outbox['id'] ) ) ? $outbox : null;
|
|
}
|
|
|
|
/**
|
|
* Get the pagination URL from the outbox.
|
|
*
|
|
* @param array $outbox The outbox data.
|
|
* @return string|null The pagination URL, or null if not found.
|
|
*/
|
|
private static function get_pagination_url( $outbox ) {
|
|
if ( 'OrderedCollection' === $outbox['type'] && ! empty( $outbox['first'] ) && is_string( $outbox['first'] ) ) {
|
|
return $outbox['first'];
|
|
}
|
|
|
|
if ( 'OrderedCollectionPage' === $outbox['type'] && ! empty( $outbox['next'] ) && is_string( $outbox['next'] ) ) {
|
|
return $outbox['next'];
|
|
}
|
|
|
|
return null;
|
|
}
|
|
}
|