mirror of
https://github.com/wallabag/wallabag.git
synced 2025-07-22 17:18:37 +00:00
Merge pull request #2920 from wallabag/cleanduplicatescommand
Clean Duplicates Command
This commit is contained in:
commit
ab742ee9c6
7 changed files with 319 additions and 2 deletions
30
docs/en/developer/console_commands.rst
Normal file
30
docs/en/developer/console_commands.rst
Normal file
|
@ -0,0 +1,30 @@
|
||||||
|
Console Commands
|
||||||
|
================
|
||||||
|
|
||||||
|
wallabag has a number of CLI commands to manage a number of tasks. You can list all the commands by executing `bin/console` in the wallabag folder.
|
||||||
|
|
||||||
|
Each command has a help accessible through `bin/console help %command%`.
|
||||||
|
|
||||||
|
.. note::
|
||||||
|
|
||||||
|
If you're in a production environment, remember to add `-e prod` to each command.
|
||||||
|
|
||||||
|
Notable commands
|
||||||
|
----------------
|
||||||
|
|
||||||
|
* `assets:install`: May be helpful if assets are missing.
|
||||||
|
* `cache:clear`: should be run after each update (included in `make update`).
|
||||||
|
* `doctrine:migrations:status`: Output the status of your database migrations.
|
||||||
|
* `fos:user:activate`: Manually activate an user.
|
||||||
|
* `fos:user:change-password`: Change a password for an user.
|
||||||
|
* `fos:user:create`: Create an user.
|
||||||
|
* `fos:user:deactivate`: Deactivate an user (not deleted).
|
||||||
|
* `fos:user:demote`: Removes a role from an user, typically admin rights.
|
||||||
|
* `fos:user:promote`: Adds a role to an user, typically admin rights.
|
||||||
|
* `rabbitmq:*`: May be useful if you're using RabbitMQ.
|
||||||
|
* `wallabag:clean-duplicates`: Removes all entry duplicates for one user or all users
|
||||||
|
* `wallabag:export`: Exports all entries for an user. You can choose the output path of the file.
|
||||||
|
* `wallabag:import`: Import entries to different formats to an user account.
|
||||||
|
* `wallabag:import:redis-worker`: Useful if you use Redis.
|
||||||
|
* `wallabag:install`: (re)Install wallabag
|
||||||
|
* `wallabag:tag:all`: Tag all entries for an user using his/her tagging rules.
|
30
docs/fr/developer/console_commands.rst
Normal file
30
docs/fr/developer/console_commands.rst
Normal file
|
@ -0,0 +1,30 @@
|
||||||
|
Actions en ligne de commande
|
||||||
|
============================
|
||||||
|
|
||||||
|
wallabag a un certain nombre de commandes CLI pour effectuer des tâches. Vous pouvez lister toutes les commandes en exécutant `bin/console` dans le dossier d'installation de wallabag.
|
||||||
|
|
||||||
|
Chaque commande a une aide correspondante accessible via `bin/console help %command%`.
|
||||||
|
|
||||||
|
.. note::
|
||||||
|
|
||||||
|
Si vous êtes dans un environnement de production, souvenez-vous d'ajouter `-e prod` à chaque commande.
|
||||||
|
|
||||||
|
Commandes notables
|
||||||
|
------------------
|
||||||
|
|
||||||
|
* `assets:install`: Peut-être utile si les *assets* sont manquants.
|
||||||
|
* `cache:clear`: doit être exécuté après chaque mise à jour (appelé dans `make update`).
|
||||||
|
* `doctrine:migrations:status`: Montre le statut de vos migrations de vos bases de données.
|
||||||
|
* `fos:user:activate`: Activer manuellement un utilisateur.
|
||||||
|
* `fos:user:change-password`: Changer le mot de passe pour un utilisateur.
|
||||||
|
* `fos:user:create`: Créer un utilisateur.
|
||||||
|
* `fos:user:deactivate`: Désactiver un utilisateur (non supprimé).
|
||||||
|
* `fos:user:demote`: Supprimer un rôle d'un utilisateur, typiquement les droits d'administration.
|
||||||
|
* `fos:user:promote`: Ajoute un rôle à un utilisateur, typiquement les droits d'administration.
|
||||||
|
* `rabbitmq:*`: Peut-être utile si vous utilisez RabbitMQ.
|
||||||
|
* `wallabag:clean-duplicates`: Supprime tous les articles dupliqués pour un utilisateur ou bien tous.
|
||||||
|
* `wallabag:export`: Exporte tous les articles pour un utilisateur. Vous pouvez choisir le chemin du fichier exporté.
|
||||||
|
* `wallabag:import`: Importe les articles en différents formats dans un compte utilisateur.
|
||||||
|
* `wallabag:import:redis-worker`: Utile si vous utilisez Redis.
|
||||||
|
* `wallabag:install`: (ré)Installer wallabag
|
||||||
|
* `wallabag:tag:all`: Tagger tous les articles pour un utilisateur ou une utilisatrice en utilisant ses règles de tags automatiques.
|
119
src/Wallabag/CoreBundle/Command/CleanDuplicatesCommand.php
Normal file
119
src/Wallabag/CoreBundle/Command/CleanDuplicatesCommand.php
Normal file
|
@ -0,0 +1,119 @@
|
||||||
|
<?php
|
||||||
|
|
||||||
|
namespace Wallabag\CoreBundle\Command;
|
||||||
|
|
||||||
|
use Doctrine\ORM\NoResultException;
|
||||||
|
use Symfony\Bundle\FrameworkBundle\Command\ContainerAwareCommand;
|
||||||
|
use Symfony\Component\Console\Input\InputArgument;
|
||||||
|
use Symfony\Component\Console\Input\InputInterface;
|
||||||
|
use Symfony\Component\Console\Output\OutputInterface;
|
||||||
|
use Wallabag\CoreBundle\Entity\Entry;
|
||||||
|
use Wallabag\UserBundle\Entity\User;
|
||||||
|
|
||||||
|
class CleanDuplicatesCommand extends ContainerAwareCommand
|
||||||
|
{
|
||||||
|
/** @var OutputInterface */
|
||||||
|
protected $output;
|
||||||
|
|
||||||
|
protected $duplicates = 0;
|
||||||
|
|
||||||
|
protected function configure()
|
||||||
|
{
|
||||||
|
$this
|
||||||
|
->setName('wallabag:clean-duplicates')
|
||||||
|
->setDescription('Cleans the database for duplicates')
|
||||||
|
->setHelp('This command helps you to clean your articles list in case of duplicates')
|
||||||
|
->addArgument(
|
||||||
|
'username',
|
||||||
|
InputArgument::OPTIONAL,
|
||||||
|
'User to clean'
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
|
protected function execute(InputInterface $input, OutputInterface $output)
|
||||||
|
{
|
||||||
|
$this->output = $output;
|
||||||
|
|
||||||
|
$username = $input->getArgument('username');
|
||||||
|
|
||||||
|
if ($username) {
|
||||||
|
try {
|
||||||
|
$user = $this->getUser($username);
|
||||||
|
$this->cleanDuplicates($user);
|
||||||
|
} catch (NoResultException $e) {
|
||||||
|
$output->writeln(sprintf('<error>User "%s" not found.</error>', $username));
|
||||||
|
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
$users = $this->getDoctrine()->getRepository('WallabagUserBundle:User')->findAll();
|
||||||
|
|
||||||
|
$output->writeln(sprintf('Cleaning through %d user accounts', count($users)));
|
||||||
|
|
||||||
|
foreach ($users as $user) {
|
||||||
|
$output->writeln(sprintf('Processing user %s', $user->getUsername()));
|
||||||
|
$this->cleanDuplicates($user);
|
||||||
|
}
|
||||||
|
$output->writeln(sprintf('Finished cleaning. %d duplicates found in total', $this->duplicates));
|
||||||
|
}
|
||||||
|
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @param User $user
|
||||||
|
*/
|
||||||
|
private function cleanDuplicates(User $user)
|
||||||
|
{
|
||||||
|
$em = $this->getContainer()->get('doctrine.orm.entity_manager');
|
||||||
|
$repo = $this->getDoctrine()->getRepository('WallabagCoreBundle:Entry');
|
||||||
|
|
||||||
|
$entries = $repo->getAllEntriesIdAndUrl($user->getId());
|
||||||
|
|
||||||
|
$duplicatesCount = 0;
|
||||||
|
$urls = [];
|
||||||
|
foreach ($entries as $entry) {
|
||||||
|
$url = $this->similarUrl($entry['url']);
|
||||||
|
|
||||||
|
/* @var $entry Entry */
|
||||||
|
if (in_array($url, $urls)) {
|
||||||
|
++$duplicatesCount;
|
||||||
|
|
||||||
|
$em->remove($repo->find($entry['id']));
|
||||||
|
$em->flush(); // Flushing at the end of the loop would require the instance not being online
|
||||||
|
} else {
|
||||||
|
$urls[] = $entry['url'];
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
$this->duplicates += $duplicatesCount;
|
||||||
|
|
||||||
|
$this->output->writeln(sprintf('Cleaned %d duplicates for user %s', $duplicatesCount, $user->getUserName()));
|
||||||
|
}
|
||||||
|
|
||||||
|
private function similarUrl($url)
|
||||||
|
{
|
||||||
|
if (in_array(substr($url, -1), ['/', '#'])) { // get rid of "/" and "#" and the end of urls
|
||||||
|
return substr($url, 0, strlen($url));
|
||||||
|
}
|
||||||
|
|
||||||
|
return $url;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Fetches a user from its username.
|
||||||
|
*
|
||||||
|
* @param string $username
|
||||||
|
*
|
||||||
|
* @return \Wallabag\UserBundle\Entity\User
|
||||||
|
*/
|
||||||
|
private function getUser($username)
|
||||||
|
{
|
||||||
|
return $this->getDoctrine()->getRepository('WallabagUserBundle:User')->findOneByUserName($username);
|
||||||
|
}
|
||||||
|
|
||||||
|
private function getDoctrine()
|
||||||
|
{
|
||||||
|
return $this->getContainer()->get('doctrine');
|
||||||
|
}
|
||||||
|
}
|
|
@ -379,4 +379,34 @@ class EntryRepository extends EntityRepository
|
||||||
->setParameter('userId', $userId)
|
->setParameter('userId', $userId)
|
||||||
->execute();
|
->execute();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Get id and url from all entries
|
||||||
|
* Used for the clean-duplicates command.
|
||||||
|
*/
|
||||||
|
public function getAllEntriesIdAndUrl($userId)
|
||||||
|
{
|
||||||
|
$qb = $this->createQueryBuilder('e')
|
||||||
|
->select('e.id, e.url')
|
||||||
|
->where('e.user = :userid')->setParameter(':userid', $userId);
|
||||||
|
|
||||||
|
return $qb->getQuery()->getArrayResult();
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Find all entries by url and owner.
|
||||||
|
*
|
||||||
|
* @param $url
|
||||||
|
* @param $userId
|
||||||
|
*
|
||||||
|
* @return array
|
||||||
|
*/
|
||||||
|
public function findAllByUrlAndUserId($url, $userId)
|
||||||
|
{
|
||||||
|
return $this->createQueryBuilder('e')
|
||||||
|
->where('e.url = :url')->setParameter('url', urldecode($url))
|
||||||
|
->andWhere('e.user = :user_id')->setParameter('user_id', $userId)
|
||||||
|
->getQuery()
|
||||||
|
->getResult();
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
108
tests/Wallabag/CoreBundle/Command/CleanDuplicatesCommandTest.php
Normal file
108
tests/Wallabag/CoreBundle/Command/CleanDuplicatesCommandTest.php
Normal file
|
@ -0,0 +1,108 @@
|
||||||
|
<?php
|
||||||
|
|
||||||
|
namespace Tests\Wallabag\CoreBundle\Command;
|
||||||
|
|
||||||
|
use Symfony\Bundle\FrameworkBundle\Console\Application;
|
||||||
|
use Symfony\Component\Console\Tester\CommandTester;
|
||||||
|
use Wallabag\CoreBundle\Command\CleanDuplicatesCommand;
|
||||||
|
use Tests\Wallabag\CoreBundle\WallabagCoreTestCase;
|
||||||
|
use Wallabag\CoreBundle\Entity\Entry;
|
||||||
|
|
||||||
|
class CleanDuplicatesCommandTest extends WallabagCoreTestCase
|
||||||
|
{
|
||||||
|
public function testRunCleanDuplicates()
|
||||||
|
{
|
||||||
|
$application = new Application($this->getClient()->getKernel());
|
||||||
|
$application->add(new CleanDuplicatesCommand());
|
||||||
|
|
||||||
|
$command = $application->find('wallabag:clean-duplicates');
|
||||||
|
|
||||||
|
$tester = new CommandTester($command);
|
||||||
|
$tester->execute([
|
||||||
|
'command' => $command->getName(),
|
||||||
|
]);
|
||||||
|
|
||||||
|
$this->assertContains('Cleaning through 3 user accounts', $tester->getDisplay());
|
||||||
|
$this->assertContains('Finished cleaning. 0 duplicates found in total', $tester->getDisplay());
|
||||||
|
}
|
||||||
|
|
||||||
|
public function testRunCleanDuplicatesCommandWithBadUsername()
|
||||||
|
{
|
||||||
|
$application = new Application($this->getClient()->getKernel());
|
||||||
|
$application->add(new CleanDuplicatesCommand());
|
||||||
|
|
||||||
|
$command = $application->find('wallabag:clean-duplicates');
|
||||||
|
|
||||||
|
$tester = new CommandTester($command);
|
||||||
|
$tester->execute([
|
||||||
|
'command' => $command->getName(),
|
||||||
|
'username' => 'unknown',
|
||||||
|
]);
|
||||||
|
|
||||||
|
$this->assertContains('User "unknown" not found', $tester->getDisplay());
|
||||||
|
}
|
||||||
|
|
||||||
|
public function testRunCleanDuplicatesCommandForUser()
|
||||||
|
{
|
||||||
|
$application = new Application($this->getClient()->getKernel());
|
||||||
|
$application->add(new CleanDuplicatesCommand());
|
||||||
|
|
||||||
|
$command = $application->find('wallabag:clean-duplicates');
|
||||||
|
|
||||||
|
$tester = new CommandTester($command);
|
||||||
|
$tester->execute([
|
||||||
|
'command' => $command->getName(),
|
||||||
|
'username' => 'admin',
|
||||||
|
]);
|
||||||
|
|
||||||
|
$this->assertContains('Cleaned 0 duplicates for user admin', $tester->getDisplay());
|
||||||
|
}
|
||||||
|
|
||||||
|
public function testDuplicate()
|
||||||
|
{
|
||||||
|
$url = 'http://www.lemonde.fr/sport/visuel/2017/05/05/rondelle-prison-blanchissage-comprendre-le-hockey-sur-glace_5122587_3242.html';
|
||||||
|
$client = $this->getClient();
|
||||||
|
$em = $client->getContainer()->get('doctrine.orm.entity_manager');
|
||||||
|
|
||||||
|
$this->logInAs('admin');
|
||||||
|
|
||||||
|
$nbEntries = $em->getRepository('WallabagCoreBundle:Entry')->findAllByUrlAndUserId($url, $this->getLoggedInUserId());
|
||||||
|
$this->assertCount(0, $nbEntries);
|
||||||
|
|
||||||
|
$user = $em->getRepository('WallabagUserBundle:User')->findOneById($this->getLoggedInUserId());
|
||||||
|
|
||||||
|
$entry1 = new Entry($user);
|
||||||
|
$entry1->setUrl($url);
|
||||||
|
|
||||||
|
$entry2 = new Entry($user);
|
||||||
|
$entry2->setUrl($url);
|
||||||
|
|
||||||
|
$em->persist($entry1);
|
||||||
|
$em->persist($entry2);
|
||||||
|
|
||||||
|
$em->flush();
|
||||||
|
|
||||||
|
$nbEntries = $em->getRepository('WallabagCoreBundle:Entry')->findAllByUrlAndUserId($url, $this->getLoggedInUserId());
|
||||||
|
$this->assertCount(2, $nbEntries);
|
||||||
|
|
||||||
|
$application = new Application($this->getClient()->getKernel());
|
||||||
|
$application->add(new CleanDuplicatesCommand());
|
||||||
|
|
||||||
|
$command = $application->find('wallabag:clean-duplicates');
|
||||||
|
|
||||||
|
$tester = new CommandTester($command);
|
||||||
|
$tester->execute([
|
||||||
|
'command' => $command->getName(),
|
||||||
|
'username' => 'admin',
|
||||||
|
]);
|
||||||
|
|
||||||
|
$this->assertContains('Cleaned 1 duplicates for user admin', $tester->getDisplay());
|
||||||
|
|
||||||
|
$nbEntries = $em->getRepository('WallabagCoreBundle:Entry')->findAllByUrlAndUserId($url, $this->getLoggedInUserId());
|
||||||
|
$this->assertCount(1, $nbEntries);
|
||||||
|
|
||||||
|
$query = $em->createQuery('DELETE FROM Wallabag\CoreBundle\Entity\Entry e WHERE e.url = :url');
|
||||||
|
$query->setParameter('url', $url);
|
||||||
|
$query->execute();
|
||||||
|
}
|
||||||
|
}
|
|
@ -70,7 +70,7 @@ class ExportCommandTest extends WallabagCoreTestCase
|
||||||
$tester->execute([
|
$tester->execute([
|
||||||
'command' => $command->getName(),
|
'command' => $command->getName(),
|
||||||
'username' => 'admin',
|
'username' => 'admin',
|
||||||
'filepath' => 'specialexport.json'
|
'filepath' => 'specialexport.json',
|
||||||
]);
|
]);
|
||||||
|
|
||||||
$this->assertFileExists('specialexport.json');
|
$this->assertFileExists('specialexport.json');
|
||||||
|
|
|
@ -111,7 +111,7 @@ class ContentProxyTest extends \PHPUnit_Framework_TestCase
|
||||||
|
|
||||||
$this->assertEquals('http://domain.io', $entry->getUrl());
|
$this->assertEquals('http://domain.io', $entry->getUrl());
|
||||||
$this->assertEquals('my title', $entry->getTitle());
|
$this->assertEquals('my title', $entry->getTitle());
|
||||||
$this->assertEquals($this->fetchingErrorMessage . '<p><i>But we found a short description: </i></p>desc', $entry->getContent());
|
$this->assertEquals($this->fetchingErrorMessage.'<p><i>But we found a short description: </i></p>desc', $entry->getContent());
|
||||||
$this->assertEmpty($entry->getPreviewPicture());
|
$this->assertEmpty($entry->getPreviewPicture());
|
||||||
$this->assertEmpty($entry->getLanguage());
|
$this->assertEmpty($entry->getLanguage());
|
||||||
$this->assertEmpty($entry->getHttpStatus());
|
$this->assertEmpty($entry->getHttpStatus());
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue