mirror of https://github.com/nextcloud/bookmarks
58 lines
1.4 KiB
PHP
58 lines
1.4 KiB
PHP
<?php
|
|
/*
|
|
* Copyright (c) 2020-2024. The Nextcloud Bookmarks contributors.
|
|
*
|
|
* This file is licensed under the Affero General Public License version 3 or later. See the COPYING file.
|
|
*/
|
|
|
|
namespace OCA\Bookmarks\BackgroundJobs;
|
|
|
|
use OCA\Bookmarks\Db\Bookmark;
|
|
use OCA\Bookmarks\Db\BookmarkMapper;
|
|
use OCA\Bookmarks\Service\BookmarkPreviewer;
|
|
use OCA\Bookmarks\Service\CrawlService;
|
|
use OCP\AppFramework\Utility\ITimeFactory;
|
|
use OCP\BackgroundJob\TimedJob;
|
|
use OCP\IConfig;
|
|
|
|
class CrawlJob extends TimedJob {
|
|
public const BATCH_SIZE = 40; // 40 bookmarks
|
|
public const INTERVAL = 5 * 60; // 5 minutes
|
|
|
|
/**
|
|
* @var BookmarkMapper
|
|
*/
|
|
private $bookmarkMapper;
|
|
/**
|
|
* @var IConfig
|
|
*/
|
|
private $settings;
|
|
/**
|
|
* @var CrawlService
|
|
*/
|
|
private $crawler;
|
|
|
|
public function __construct(
|
|
IConfig $settings, BookmarkMapper $bookmarkMapper, CrawlService $crawler, ITimeFactory $timeFactory
|
|
) {
|
|
parent::__construct($timeFactory);
|
|
$this->settings = $settings;
|
|
$this->bookmarkMapper = $bookmarkMapper;
|
|
|
|
$this->setInterval(self::INTERVAL);
|
|
$this->crawler = $crawler;
|
|
}
|
|
|
|
protected function run($argument) {
|
|
if ($this->settings->getAppValue('bookmarks', 'privacy.enableScraping', 'false') !== 'true') {
|
|
return;
|
|
}
|
|
|
|
/** @var Bookmark[] $bookmarks */
|
|
$bookmarks = $this->bookmarkMapper->findPendingPreviews(self::BATCH_SIZE, BookmarkPreviewer::CACHE_TTL);
|
|
foreach ($bookmarks as $bookmark) {
|
|
$this->crawler->crawl($bookmark);
|
|
}
|
|
}
|
|
}
|