bookmarks/lib/BackgroundJobs/CrawlJob.php

58 lines
1.4 KiB
PHP

<?php
/*
* Copyright (c) 2020-2024. The Nextcloud Bookmarks contributors.
*
* This file is licensed under the Affero General Public License version 3 or later. See the COPYING file.
*/
namespace OCA\Bookmarks\BackgroundJobs;
use OCA\Bookmarks\Db\Bookmark;
use OCA\Bookmarks\Db\BookmarkMapper;
use OCA\Bookmarks\Service\BookmarkPreviewer;
use OCA\Bookmarks\Service\CrawlService;
use OCP\AppFramework\Utility\ITimeFactory;
use OCP\BackgroundJob\TimedJob;
use OCP\IConfig;
class CrawlJob extends TimedJob {
public const BATCH_SIZE = 40; // 40 bookmarks
public const INTERVAL = 5 * 60; // 5 minutes
/**
* @var BookmarkMapper
*/
private $bookmarkMapper;
/**
* @var IConfig
*/
private $settings;
/**
* @var CrawlService
*/
private $crawler;
public function __construct(
IConfig $settings, BookmarkMapper $bookmarkMapper, CrawlService $crawler, ITimeFactory $timeFactory
) {
parent::__construct($timeFactory);
$this->settings = $settings;
$this->bookmarkMapper = $bookmarkMapper;
$this->setInterval(self::INTERVAL);
$this->crawler = $crawler;
}
protected function run($argument) {
if ($this->settings->getAppValue('bookmarks', 'privacy.enableScraping', 'false') !== 'true') {
return;
}
/** @var Bookmark[] $bookmarks */
$bookmarks = $this->bookmarkMapper->findPendingPreviews(self::BATCH_SIZE, BookmarkPreviewer::CACHE_TTL);
foreach ($bookmarks as $bookmark) {
$this->crawler->crawl($bookmark);
}
}
}