1
0
Fork 0
mirror of synced 2024-06-02 10:54:44 +12:00
appwrite/app/workers/deletes.php

413 lines
13 KiB
PHP
Raw Normal View History

<?php
2021-07-14 07:24:52 +12:00
use Utopia\Database\Database;
use Utopia\Database\Document;
2021-07-13 09:57:37 +12:00
use Utopia\Database\Query;
2021-07-14 07:24:52 +12:00
use Utopia\Database\Validator\Authorization;
use Appwrite\Resque\Worker;
2021-01-22 21:28:33 +13:00
use Utopia\Storage\Device\Local;
2020-12-19 03:08:28 +13:00
use Utopia\Abuse\Abuse;
use Utopia\Abuse\Adapters\TimeLimit;
use Utopia\CLI\Console;
use Utopia\Audit\Audit;
use Utopia\Cache\Adapter\Redis as RedisCache;
2021-06-07 17:17:29 +12:00
use Utopia\Cache\Cache;
use Utopia\Database\Adapter\MariaDB;
require_once __DIR__.'/../workers.php';
2020-12-19 21:08:03 +13:00
2021-01-15 19:02:48 +13:00
// Set the worker's console title, then print a start-up message.
Console::title('Deletes V1 Worker');
Console::success(
    APP_NAME . ' deletes worker v1 has started' . "\n"
);
class DeletesV1 extends Worker
{
public $args = [];
protected $consoleDB = null;
/**
 * Worker set-up hook.
 *
 * Intentionally empty: this worker performs no set-up here.
 */
public function init(): void
{
}
/**
 * Dispatch the delete job described by $this->args.
 *
 * Reads `type` (compared against the DELETE_TYPE_* constants) and, depending
 * on it, `projectId`, `document` and `timestamp`:
 *  - DELETE_TYPE_DOCUMENT: cleans up the resources attached to the given
 *    document, chosen by the document's collection.
 *  - DELETE_TYPE_EXECUTIONS / _AUDIT / _ABUSE: prunes logs using `timestamp`.
 *  - DELETE_TYPE_CERTIFICATES: removes certificate files for the document.
 *
 * Unknown types and unknown collections are only reported on the console.
 */
public function run(): void
{
    $projectId = $this->args['projectId'] ?? '';
    $type = $this->args['type'] ?? '';

    switch (strval($type)) {
        case DELETE_TYPE_DOCUMENT:
            // Default to an empty array: Document is built from an array, so
            // the previous '' default failed whenever the argument was missing.
            $document = new Document($this->args['document'] ?? []);

            switch ($document->getCollection()) {
                // TODO@kodumbeats define these as constants somewhere
                case 'projects':
                    $this->deleteProject($document);
                    break;

                case 'functions':
                    $this->deleteFunction($document, $projectId);
                    break;

                case 'users':
                    $this->deleteUser($document, $projectId);
                    break;

                case 'teams':
                    $this->deleteMemberships($document, $projectId);
                    break;

                case 'buckets':
                    $this->deleteBucket($document, $projectId);
                    break;

                default:
                    Console::error('No lazy delete operation available for document of type: '.$document->getCollection());
                    break;
            }
            break;

        case DELETE_TYPE_EXECUTIONS:
            // A missing timestamp becomes 0 instead of raising an
            // undefined-index warning.
            $this->deleteExecutionLogs($this->args['timestamp'] ?? 0);
            break;

        case DELETE_TYPE_AUDIT:
            // 0 is rejected by deleteAuditLogs() with an exception.
            $this->deleteAuditLogs($this->args['timestamp'] ?? 0);
            break;

        case DELETE_TYPE_ABUSE:
            // 0 is rejected by deleteAbuseLogs() with an exception.
            $this->deleteAbuseLogs($this->args['timestamp'] ?? 0);
            break;

        case DELETE_TYPE_CERTIFICATES:
            $document = new Document($this->args['document'] ?? []);
            $this->deleteCertificates($document);
            break;

        default:
            Console::error('No delete operation for type: '.$type);
            break;
    }
}
/**
 * Worker tear-down hook.
 *
 * Intentionally empty: this worker performs no clean-up here.
 */
public function shutdown(): void
{
}
2021-07-14 07:24:52 +12:00
/**
 * Delete every membership that belongs to a team.
 *
 * @param Document $document teams document
 * @param string $projectId
 */
protected function deleteMemberships(Document $document, $projectId)
{
    // run() passes the team document itself, so the team's ID is the
    // document's own ID. An explicit non-empty `teamId` attribute is still
    // honoured for backward compatibility. Previously a missing attribute
    // produced '' and the query matched no memberships.
    // NOTE(review): team documents are assumed not to carry a `teamId`
    // attribute of their own - confirm against the collection schema.
    $teamId = $document->getAttribute('teamId', '') ?: $document->getId();

    // Delete Memberships
    $this->deleteByGroup('memberships', [
        new Query('teamId', Query::TYPE_EQUAL, [$teamId])
    ], $this->getInternalDB($projectId));
}
2021-07-14 07:24:52 +12:00
/**
 * Remove everything stored for a project: its external and internal
 * databases and its upload and cache storage directories.
 *
 * @param Document $document project document
 */
protected function deleteProject(Document $document)
{
    $projectId = $document->getId();

    // Databases first: external, then internal
    $this->getExternalDB($projectId)->delete();
    $this->getInternalDB($projectId)->delete();

    // Then the storage directories: uploads, then cache
    foreach ([APP_STORAGE_UPLOADS, APP_STORAGE_CACHE] as $storageBase) {
        $device = new Local($storageBase.'/app-'.$projectId);
        $device->delete($device->getRoot(), true);
    }
}
2021-07-14 07:24:52 +12:00
/**
 * Delete a user's memberships and decrement the member count (`sum`) of
 * every team the user was a confirmed member of.
 *
 * @param Document $document user document
 * @param string $projectId
 */
protected function deleteUser(Document $document, $projectId)
{
    $userId = $document->getId();

    // One database handle is shared by the query and the callback instead
    // of building a new Database/Cache pair twice per membership.
    $dbForInternal = $this->getInternalDB($projectId);

    // Tokens and Sessions removed with user document
    // Delete Memberships and decrement team membership counts
    $this->deleteByGroup('memberships', [
        new Query('userId', Query::TYPE_EQUAL, [$userId])
    ], $dbForInternal, function (Document $document) use ($dbForInternal) {
        if (!$document->getAttribute('confirm')) { // Count only confirmed members
            return;
        }

        $teamId = $document->getAttribute('teamId');
        $team = $dbForInternal->getDocument('teams', $teamId);

        if ($team->isEmpty()) {
            return;
        }

        $dbForInternal->updateDocument('teams', $teamId, new Document(\array_merge($team->getArrayCopy(), [
            'sum' => \max($team->getAttribute('sum', 0) - 1, 0), // Ensure that sum >= 0
        ])));
    });
}
2021-07-14 07:24:52 +12:00
/**
 * Delete, for every project, the executions whose `dateCreated` is lesser
 * than the given timestamp.
 *
 * @param int $timestamp
 */
protected function deleteExecutionLogs($timestamp)
{
    $this->deleteForProjectIds(function ($projectId) use ($timestamp) {
        // getInternalDB() is declared to return a Database, so the former
        // "failed to get projectDB" check could never trigger and was removed.
        $dbForInternal = $this->getInternalDB($projectId);

        // Delete Executions
        $this->deleteByGroup('executions', [
            new Query('dateCreated', Query::TYPE_LESSER, [$timestamp])
        ], $dbForInternal);
    });
}
2021-07-14 07:24:52 +12:00
/**
 * Run the abuse-log cleanup for every project, passing it the timestamp.
 *
 * @param int $timestamp
 *
 * @throws Exception when no timestamp is given or a project's cleanup fails
 */
protected function deleteAbuseLogs($timestamp)
{
    // Loose comparison on purpose: null, '' and '0' also count as missing.
    if ($timestamp == 0) {
        // The message previously said "audit logs" (copied from deleteAuditLogs).
        throw new Exception('Failed to delete abuse logs. No timestamp provided');
    }

    $this->deleteForProjectIds(function ($projectId) use ($timestamp) {
        $timeLimit = new TimeLimit("", 0, 1, $this->getInternalDB($projectId));
        $abuse = new Abuse($timeLimit);

        $status = $abuse->cleanup($timestamp);
        if (!$status) {
            throw new Exception('Failed to delete Abuse logs for project '.$projectId);
        }
    });
}
2021-07-14 07:24:52 +12:00
/**
 * Run the audit-log cleanup for every project, passing it the timestamp.
 *
 * @param int $timestamp
 *
 * @throws Exception when no timestamp is given or a project's cleanup fails
 */
protected function deleteAuditLogs($timestamp)
{
    // Loose comparison on purpose: null, '' and '0' also count as missing.
    if ($timestamp == 0) {
        throw new Exception('Failed to delete audit logs. No timestamp provided');
    }

    $this->deleteForProjectIds(function ($projectId) use ($timestamp) {
        $audit = new Audit($this->getInternalDB($projectId));

        $status = $audit->cleanup($timestamp);
        if (!$status) {
            // A space was missing between "project" and the ID.
            throw new Exception('Failed to delete Audit logs for project '.$projectId);
        }
    });
}
2021-07-14 07:24:52 +12:00
/**
 * Delete a function's tags (including each tag's stored code path) and
 * the function's executions.
 *
 * @param Document $document function document
 * @param string $projectId
 */
protected function deleteFunction(Document $document, $projectId)
{
    $database = $this->getInternalDB($projectId);
    $storage = new Local(APP_STORAGE_FUNCTIONS.'/app-'.$projectId);

    // Runs once per deleted tag: remove the tag's code and report the result
    $removeCode = function (Document $tag) use ($storage) {
        if (!$storage->delete($tag->getAttribute('path', ''))) {
            Console::error('Failed to delete code tag: '.$tag->getAttribute('path', ''));
            return;
        }

        Console::success('Delete code tag: '.$tag->getAttribute('path', ''));
    };

    // Tags first ...
    $tagQueries = [
        new Query('functionId', Query::TYPE_EQUAL, [$document->getId()]),
    ];
    $this->deleteByGroup('tags', $tagQueries, $database, $removeCode);

    // ... then executions
    $executionQueries = [
        new Query('functionId', Query::TYPE_EQUAL, [$document->getId()]),
    ];
    $this->deleteByGroup('executions', $executionQueries, $database);
}
2021-07-14 07:24:52 +12:00
/**
 * Delete a single document with authorization disabled, then invoke the
 * optional callback with the deleted document.
 *
 * Authorization is reset before returning on every path, including when
 * the delete or the callback throws. Previously the reset sat after the
 * return statements and never ran.
 *
 * @param Document $document to be deleted
 * @param Database $database to delete it from
 * @param callable $callback to perform after document is deleted
 *
 * @return bool true when the document was deleted, false otherwise
 */
protected function deleteById(Document $document, Database $database, ?callable $callback = null): bool
{
    Authorization::disable();

    try {
        // TODO@kodumbeats is it better to pass objects or ID strings?
        if (!$database->deleteDocument($document->getCollection(), $document->getId())) {
            Console::error('Failed to delete document: '.$document->getId());
            return false;
        }

        Console::success('Deleted document "'.$document->getId().'" successfully');

        // The callback still runs while authorization is disabled, as before.
        if (is_callable($callback)) {
            $callback($document);
        }

        return true;
    } finally {
        Authorization::reset();
    }
}
2021-07-14 07:24:52 +12:00
/**
 * Invoke the callback once per project ID, reading the console `projects`
 * collection in pages of 50.
 *
 * Each page is requested with an increasing offset. Previously no offset
 * was passed, so every iteration re-read the first page: projects beyond
 * the first 50 were never processed and the loop never ended once 50 or
 * more projects existed.
 *
 * @param callable $callback receives the project ID as its only argument
 */
protected function deleteForProjectIds(callable $callback)
{
    $count = 0;
    $chunk = 0;
    $limit = 50;
    $sum = $limit;

    $dbForConsole = $this->getConsoleDB();

    $executionStart = \microtime(true);

    // A page shorter than $limit means the last page has been reached.
    while ($sum === $limit) {
        $offset = $chunk * $limit;
        $chunk++;

        Authorization::disable();
        $projects = $dbForConsole->find('projects', [], $limit, $offset);
        Authorization::reset();

        $projectIds = array_map(function ($project) {
            return $project->getId();
        }, $projects);

        $sum = count($projects);

        Console::info('Executing delete function for chunk #'.$chunk.'. Found '.$sum.' projects');

        foreach ($projectIds as $projectId) {
            $callback($projectId);
            $count++;
        }
    }

    $executionEnd = \microtime(true);

    Console::info("Found {$count} projects " . ($executionEnd - $executionStart) . " seconds");
}
2021-07-13 09:57:37 +12:00
/**
 * Delete every document of a collection that matches the queries, in
 * chunks of 50, calling the optional callback for each deleted document.
 *
 * The query always uses offset 0 because deleted documents drop out of the
 * result set. If a chunk is non-empty and not one of its documents could be
 * deleted, the loop stops: it would otherwise fetch the same documents
 * forever.
 *
 * @param string $collection collectionID
 * @param Query[] $queries
 * @param Database $database
 * @param callable $callback
 */
protected function deleteByGroup(string $collection, array $queries, Database $database, ?callable $callback = null)
{
    $count = 0;
    $chunk = 0;
    $limit = 50;
    $sum = $limit;

    $executionStart = \microtime(true);

    while ($sum === $limit) {
        $chunk++;

        Authorization::disable();
        $results = $database->find($collection, $queries, $limit, 0);
        Authorization::reset();

        $sum = count($results);

        Console::info('Deleting chunk #'.$chunk.'. Found '.$sum.' documents');

        // Count only documents that were really deleted.
        $deleted = 0;
        foreach ($results as $document) {
            if ($this->deleteById($document, $database, $callback)) {
                $deleted++;
            }
        }
        $count += $deleted;

        if ($sum > 0 && $deleted === 0) {
            Console::error('Stopping delete by group for "'.$collection.'": no document of chunk #'.$chunk.' could be deleted');
            break;
        }
    }

    $executionEnd = \microtime(true);

    Console::info("Deleted {$count} document by group in " . ($executionEnd - $executionStart) . " seconds");
}
2021-07-14 07:24:52 +12:00
/**
 * Delete the certificate directory of the document's domain.
 *
 * Files matching `*.*` inside APP_STORAGE_CERTIFICATES/<domain> are
 * unlinked and the directory is then removed. Nothing is deleted when the
 * domain is empty, the directory does not exist, or its resolved path
 * differs from the built one (path-traversal guard).
 *
 * @param Document $document certificates document
 *
 * @return void
 */
protected function deleteCertificates(Document $document)
{
    $domain = $document->getAttribute('domain');
    $directory = APP_STORAGE_CERTIFICATES . '/' . $domain;

    // realpath() resolves '..' and symlinks; any difference means the
    // domain tried to point outside the expected location.
    $checkTraversal = realpath($directory) === $directory;

    if ($domain && $checkTraversal && is_dir($directory)) {
        // glob() may return false on error; treat that as "no files".
        array_map('unlink', glob($directory.'/*.*') ?: []);
        rmdir($directory);
        Console::info("Deleted certificate files for {$domain}");
    } else {
        Console::info("No certificate files found for {$domain}");
    }
}
2021-07-18 19:03:48 +12:00
/**
 * Delete the `files` documents of a bucket; after each deleted file the
 * bucket's path under the project's uploads storage is removed.
 *
 * @param Document $document buckets document
 * @param string $projectId
 */
protected function deleteBucket(Document $document, string $projectId)
{
    $bucketId = $document->getId();

    $filesOfBucket = [
        new Query('bucketId', Query::TYPE_EQUAL, [$bucketId]),
    ];
    $database = $this->getInternalDB($projectId);

    // Invoked by deleteByGroup() once per deleted file document
    $removeBucketPath = function () use ($projectId, $bucketId) {
        $storage = new Local(APP_STORAGE_UPLOADS.'/app-'.$projectId);
        $storage->deletePath($storage->getRoot() . DIRECTORY_SEPARATOR . $bucketId);
    };

    $this->deleteByGroup('files', $filesOfBucket, $database, $removeBucketPath);
}
2021-06-07 17:17:29 +12:00
/**
 * Build a Database handle namespaced to a project's internal data
 * (`project_<projectId>_internal`), backed by the registered `db` and
 * `cache` resources.
 *
 * @param string $projectId
 * @return Database
 */
protected function getInternalDB($projectId): Database
{
    global $register;

    $redis = new RedisCache($register->get('cache'));
    $cache = new Cache($redis);

    $adapter = new MariaDB($register->get('db'));
    $database = new Database($adapter, $cache);

    $database->setNamespace('project_'.$projectId.'_internal'); // Main DB

    return $database;
}
2021-07-14 06:44:45 +12:00
/**
 * Build a Database handle namespaced to a project's external data
 * (`project_<projectId>_external`), backed by the registered `db` and
 * `cache` resources.
 *
 * @param string $projectId
 * @return Database
 */
protected function getExternalDB($projectId): Database
{
    global $register;

    $redis = new RedisCache($register->get('cache'));
    $cache = new Cache($redis);

    $adapter = new MariaDB($register->get('db'));
    $database = new Database($adapter, $cache);

    $database->setNamespace('project_'.$projectId.'_external'); // Main DB

    return $database;
}
/**
 * Build a Database handle for the console namespace
 * (`project_console_internal`), backed by the registered `db` and `cache`
 * resources.
 *
 * @return Database
 */
protected function getConsoleDB(): Database
{
    global $register;

    $redis = new RedisCache($register->get('cache'));
    $cache = new Cache($redis);

    $adapter = new MariaDB($register->get('db'));
    $database = new Database($adapter, $cache);

    $database->setNamespace('project_console_internal'); // Main DB

    return $database;
}
}