wallabag/src/Wallabag/CoreBundle/Command/CleanDuplicatesCommand.php

115 lines
3.4 KiB
PHP
Raw Normal View History

2017-02-24 10:27:03 +00:00
<?php
namespace Wallabag\CoreBundle\Command;
use Doctrine\ORM\NoResultException;
use Symfony\Bundle\FrameworkBundle\Command\ContainerAwareCommand;
use Symfony\Component\Console\Input\InputArgument;
use Symfony\Component\Console\Input\InputInterface;
use Symfony\Component\Console\Output\OutputInterface;
use Wallabag\CoreBundle\Entity\Entry;
use Wallabag\UserBundle\Entity\User;
/**
 * Console command "wallabag:clean-duplicates".
 *
 * Removes duplicated entries (same URL, ignoring one trailing "/" or "#")
 * either for a single user, when a username argument is given, or for every
 * user returned by the user repository.
 */
class CleanDuplicatesCommand extends ContainerAwareCommand
{
    /** @var OutputInterface */
    protected $output;

    /** @var int Running total of duplicates removed across all processed users */
    protected $duplicates = 0;

    /**
     * Declares the command name, description, help text and its optional
     * "username" argument.
     */
    protected function configure()
    {
        $this
            ->setName('wallabag:clean-duplicates')
            ->setDescription('Cleans the database for duplicates')
            ->setHelp('This command helps you to clean your articles list in case of duplicates')
            ->addArgument(
                'username',
                InputArgument::OPTIONAL,
                'User to clean'
            );
    }

    /**
     * Runs the clean-up for one user or for all users.
     *
     * @param InputInterface  $input
     * @param OutputInterface $output
     *
     * @return int 0 on success, 1 when the requested user does not exist
     */
    protected function execute(InputInterface $input, OutputInterface $output)
    {
        $this->output = $output;

        $username = $input->getArgument('username');

        // Explicit comparison instead of a truthiness test: a user named "0"
        // must be handled as a single user, not as "no username given".
        if (null !== $username && '' !== $username) {
            // Only the lookup is guarded, so that an unrelated failure during
            // the clean-up is never reported as "user not found".
            try {
                $user = $this->getUser($username);
            } catch (NoResultException $e) {
                $output->writeln(sprintf('<error>User "%s" not found.</error>', $username));

                return 1;
            }

            $this->cleanDuplicates($user);

            return 0;
        }

        $users = $this->getContainer()->get('wallabag_user.user_repository')->findAll();

        $output->writeln(sprintf('Cleaning through %d user accounts', count($users)));

        foreach ($users as $user) {
            $output->writeln(sprintf('Processing user %s', $user->getUsername()));
            $this->cleanDuplicates($user);
        }

        $output->writeln(sprintf('Finished cleaning. %d duplicates found in total', $this->duplicates));

        return 0;
    }

    /**
     * Removes every entry of the given user whose normalized URL was already
     * seen earlier in the list returned by the entry repository. The first
     * entry encountered for a URL is kept.
     *
     * @param User $user
     */
    private function cleanDuplicates(User $user)
    {
        $em = $this->getContainer()->get('doctrine.orm.entity_manager');
        $repo = $this->getContainer()->get('wallabag_core.entry_repository');

        // Each row is an array exposing at least the 'id' and 'url' keys.
        $entries = $repo->getAllEntriesIdAndUrl($user->getId());

        $duplicatesCount = 0;
        $urls = [];

        foreach ($entries as $entry) {
            $url = $this->similarUrl($entry['url']);

            if (!in_array($url, $urls, true)) {
                // Remember the *normalized* URL so that later entries are
                // compared against the same form they are normalized to.
                $urls[] = $url;

                continue;
            }

            /** @var Entry|null $duplicate */
            $duplicate = $repo->find($entry['id']);

            if (null === $duplicate) {
                // The entry is no longer there (the instance may be in use
                // while the command runs): nothing to remove.
                continue;
            }

            ++$duplicatesCount;

            $em->remove($duplicate);
            $em->flush(); // Flushing at the end of the loop would require the instance not being online
        }

        $this->duplicates += $duplicatesCount;

        $this->output->writeln(sprintf('Cleaned %d duplicates for user %s', $duplicatesCount, $user->getUsername()));
    }

    /**
     * Normalizes a URL for duplicate detection by dropping a single trailing
     * "/" or "#".
     *
     * @param string $url
     *
     * @return string
     */
    private function similarUrl($url)
    {
        if (in_array(substr($url, -1), ['/', '#'], true)) { // get rid of "/" and "#" at the end of urls
            // Negative length: keep everything except the last character.
            return substr($url, 0, -1);
        }

        return $url;
    }

    /**
     * Fetches a user from its username.
     *
     * @param string $username
     *
     * @throws NoResultException when the repository finds no user for this username
     *
     * @return \Wallabag\UserBundle\Entity\User
     */
    private function getUser($username)
    {
        $user = $this->getContainer()->get('wallabag_user.user_repository')->findOneByUserName($username);

        // A Doctrine findOneBy* finder reports a miss by returning null, not
        // by throwing; convert it into the exception execute() handles.
        if (null === $user) {
            throw new NoResultException();
        }

        return $user;
    }
}