aboutsummaryrefslogtreecommitdiffstats
path: root/apps/files_sharing/lib/DeleteOrphanedSharesJob.php
diff options
context:
space:
mode:
Diffstat (limited to 'apps/files_sharing/lib/DeleteOrphanedSharesJob.php')
-rw-r--r--apps/files_sharing/lib/DeleteOrphanedSharesJob.php133
1 files changed, 133 insertions, 0 deletions
diff --git a/apps/files_sharing/lib/DeleteOrphanedSharesJob.php b/apps/files_sharing/lib/DeleteOrphanedSharesJob.php
new file mode 100644
index 00000000000..63f057e3bf4
--- /dev/null
+++ b/apps/files_sharing/lib/DeleteOrphanedSharesJob.php
@@ -0,0 +1,133 @@
+<?php
+
+declare(strict_types=1);
+/**
+ * SPDX-FileCopyrightText: 2020-2024 Nextcloud GmbH and Nextcloud contributors
+ * SPDX-FileCopyrightText: 2016 ownCloud, Inc.
+ * SPDX-License-Identifier: AGPL-3.0-only
+ */
+namespace OCA\Files_Sharing;
+
+use OCP\AppFramework\Db\TTransactional;
+use OCP\AppFramework\Utility\ITimeFactory;
+use OCP\BackgroundJob\TimedJob;
+use OCP\DB\QueryBuilder\IQueryBuilder;
+use OCP\IDBConnection;
+use PDO;
+use Psr\Log\LoggerInterface;
+use function array_map;
+
+/**
+ * Delete all share entries that have no matching entries in the file cache table.
+ */
+class DeleteOrphanedSharesJob extends TimedJob {
+
+ use TTransactional;
+
+ private const CHUNK_SIZE = 1000;
+
+ private const INTERVAL = 24 * 60 * 60;
+
+ /**
+ * sets the correct interval for this timed job
+ */
+ public function __construct(
+ ITimeFactory $time,
+ private IDBConnection $db,
+ private LoggerInterface $logger,
+ ) {
+ parent::__construct($time);
+
+ $this->setInterval(self::INTERVAL); // 1 day
+ $this->setTimeSensitivity(self::TIME_INSENSITIVE);
+ }
+
+ /**
+ * Makes the background job do its work
+ *
+ * @param array $argument unused argument
+ */
+ public function run($argument) {
+ if ($this->db->getShardDefinition('filecache')) {
+ $this->shardingCleanup();
+ return;
+ }
+
+ $qbSelect = $this->db->getQueryBuilder();
+ $qbSelect->select('id')
+ ->from('share', 's')
+ ->leftJoin('s', 'filecache', 'fc', $qbSelect->expr()->eq('s.file_source', 'fc.fileid'))
+ ->where($qbSelect->expr()->isNull('fc.fileid'))
+ ->setMaxResults(self::CHUNK_SIZE);
+ $deleteQb = $this->db->getQueryBuilder();
+ $deleteQb->delete('share')
+ ->where(
+ $deleteQb->expr()->in('id', $deleteQb->createParameter('ids'), IQueryBuilder::PARAM_INT_ARRAY)
+ );
+
+ /**
+ * Read a chunk of orphan rows and delete them. Continue as long as the
+ * chunk is filled and time before the next cron run does not run out.
+ *
+ * Note: With isolation level READ COMMITTED, the database will allow
+ * other transactions to delete rows between our SELECT and DELETE. In
+ * that (unlikely) case, our DELETE will have fewer affected rows than
+ * IDs passed for the WHERE IN. If this happens while processing a full
+ * chunk, the logic below will stop prematurely.
+ * Note: The queries below are optimized for low database locking. They
+ * could be combined into one single DELETE with join or sub query, but
+ * that has shown to (dead)lock often.
+ */
+ $cutOff = $this->time->getTime() + self::INTERVAL;
+ do {
+ $deleted = $this->atomic(function () use ($qbSelect, $deleteQb) {
+ $result = $qbSelect->executeQuery();
+ $ids = array_map('intval', $result->fetchAll(PDO::FETCH_COLUMN));
+ $result->closeCursor();
+ $deleteQb->setParameter('ids', $ids, IQueryBuilder::PARAM_INT_ARRAY);
+ $deleted = $deleteQb->executeStatement();
+ $this->logger->debug('{deleted} orphaned share(s) deleted', [
+ 'app' => 'DeleteOrphanedSharesJob',
+ 'deleted' => $deleted,
+ ]);
+ return $deleted;
+ }, $this->db);
+ } while ($deleted >= self::CHUNK_SIZE && $this->time->getTime() <= $cutOff);
+ }
+
+ private function shardingCleanup(): void {
+ $qb = $this->db->getQueryBuilder();
+ $qb->selectDistinct('file_source')
+ ->from('share', 's');
+ $sourceFiles = $qb->executeQuery()->fetchAll(PDO::FETCH_COLUMN);
+
+ $deleteQb = $this->db->getQueryBuilder();
+ $deleteQb->delete('share')
+ ->where(
+ $deleteQb->expr()->in('file_source', $deleteQb->createParameter('ids'), IQueryBuilder::PARAM_INT_ARRAY)
+ );
+
+ $chunks = array_chunk($sourceFiles, self::CHUNK_SIZE);
+ foreach ($chunks as $chunk) {
+ $deletedFiles = $this->findMissingSources($chunk);
+ $this->atomic(function () use ($deletedFiles, $deleteQb) {
+ $deleteQb->setParameter('ids', $deletedFiles, IQueryBuilder::PARAM_INT_ARRAY);
+ $deleted = $deleteQb->executeStatement();
+ $this->logger->debug('{deleted} orphaned share(s) deleted', [
+ 'app' => 'DeleteOrphanedSharesJob',
+ 'deleted' => $deleted,
+ ]);
+ return $deleted;
+ }, $this->db);
+ }
+ }
+
+ private function findMissingSources(array $ids): array {
+ $qb = $this->db->getQueryBuilder();
+ $qb->select('fileid')
+ ->from('filecache')
+ ->where($qb->expr()->in('fileid', $qb->createNamedParameter($ids, IQueryBuilder::PARAM_INT_ARRAY)));
+ $found = $qb->executeQuery()->fetchAll(\PDO::FETCH_COLUMN);
+ return array_diff($ids, $found);
+ }
+}