Merge pull request #3271 from wallabag/store-resolved-url

Add `given_url` in Entry table to check if a redirected url has already been added
This commit is contained in:
Jérémy Benoist 2019-06-05 11:38:00 +02:00 committed by GitHub
commit 16e1c07553
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
5 changed files with 164 additions and 11 deletions

View file

@ -0,0 +1,54 @@
<?php
namespace Application\Migrations;
use Doctrine\DBAL\Schema\Schema;
use Wallabag\CoreBundle\Doctrine\WallabagMigration;
/**
 * Added `given_url` & `hashed_given_url` fields in entry table,
 * plus the `hashed_given_url_user_id` index over (`user_id`, `hashed_given_url`).
 *
 * Every schema change is guarded by an existence check so that both
 * directions can be run against a schema that is already (partially) migrated.
 */
class Version20190601125843 extends WallabagMigration
{
    /**
     * Add the two nullable columns and the composite index when they are missing.
     *
     * @param Schema $schema Schema to alter
     */
    public function up(Schema $schema)
    {
        $entryTable = $schema->getTable($this->getTable('entry'));

        if (!$entryTable->hasColumn('given_url')) {
            $entryTable->addColumn('given_url', 'text', [
                'notnull' => false,
            ]);
        }

        if (!$entryTable->hasColumn('hashed_given_url')) {
            $entryTable->addColumn('hashed_given_url', 'text', [
                'length' => 40,
                'notnull' => false,
            ]);
        }

        // Guarded like the columns above: adding an index whose name is
        // already taken on the table raises a schema exception.
        if (!$entryTable->hasIndex('hashed_given_url_user_id')) {
            // 40 = length of sha1 field hashed_given_url
            $entryTable->addIndex(['user_id', 'hashed_given_url'], 'hashed_given_url_user_id', [], ['lengths' => [null, 40]]);
        }
    }

    /**
     * Remove the composite index and the two columns when they are present.
     *
     * @param Schema $schema Schema to alter
     */
    public function down(Schema $schema)
    {
        $entryTable = $schema->getTable($this->getTable('entry'));

        // Dropped first, so the index never references a column that has
        // already been removed from the schema object; guarded because
        // dropping an unknown index raises a schema exception.
        if ($entryTable->hasIndex('hashed_given_url_user_id')) {
            $entryTable->dropIndex('hashed_given_url_user_id');
        }

        if ($entryTable->hasColumn('given_url')) {
            $entryTable->dropColumn('given_url');
        }

        if ($entryTable->hasColumn('hashed_given_url')) {
            $entryTable->dropColumn('hashed_given_url');
        }
    }
}

View file

@ -27,7 +27,8 @@ use Wallabag\UserBundle\Entity\User;
* indexes={ * indexes={
* @ORM\Index(name="created_at", columns={"created_at"}), * @ORM\Index(name="created_at", columns={"created_at"}),
* @ORM\Index(name="uid", columns={"uid"}), * @ORM\Index(name="uid", columns={"uid"}),
* @ORM\Index(name="hashed_url_user_id", columns={"user_id", "hashed_url"}, options={"lengths"={null, 40}}) * @ORM\Index(name="hashed_url_user_id", columns={"user_id", "hashed_url"}, options={"lengths"={null, 40}}),
* @ORM\Index(name="hashed_given_url_user_id", columns={"user_id", "hashed_given_url"}, options={"lengths"={null, 40}})
* } * }
* ) * )
* @ORM\HasLifecycleCallbacks() * @ORM\HasLifecycleCallbacks()
@ -68,6 +69,8 @@ class Entry
private $title; private $title;
/** /**
* Define the url fetched by wallabag (the final url after potential redirections).
*
* @var string * @var string
* *
* @Assert\NotBlank() * @Assert\NotBlank()
@ -84,6 +87,35 @@ class Entry
*/ */
private $hashedUrl; private $hashedUrl;
/**
* Where the user found the url (another article, a tweet, or the given_url if none is provided).
*
* @var string
*
* @ORM\Column(name="origin_url", type="text", nullable=true)
*
* @Groups({"entries_for_user", "export_all"})
*/
private $originUrl;
/**
* Define the url entered by the user (without redirections).
*
* @var string
*
* @ORM\Column(name="given_url", type="text", nullable=true)
*
* @Groups({"entries_for_user", "export_all"})
*/
private $givenUrl;
/**
* @var string
*
* @ORM\Column(name="hashed_given_url", type="string", length=40, nullable=true)
*/
private $hashedGivenUrl;
/** /**
* @var bool * @var bool
* *
@ -263,15 +295,6 @@ class Entry
*/ */
private $tags; private $tags;
/**
* @var string
*
* @ORM\Column(name="origin_url", type="text", nullable=true)
*
* @Groups({"entries_for_user", "export_all"})
*/
private $originUrl;
/* /*
* @param User $user * @param User $user
*/ */
@ -922,6 +945,31 @@ class Entry
return $this->originUrl; return $this->originUrl;
} }
/**
 * Set given url.
 *
 * Stores the url and, in the same call, refreshes `hashedGivenUrl` with the
 * result of `UrlHasher::hashUrl()` so the stored hash always corresponds to
 * the stored url.
 *
 * @param string $givenUrl Url to store; it is also the value passed to the hasher
 *
 * @return Entry The current instance, to allow call chaining
 */
public function setGivenUrl($givenUrl)
{
    $this->givenUrl = $givenUrl;
    // Keep the hash in sync with the url it was computed from.
    $this->hashedGivenUrl = UrlHasher::hashUrl($givenUrl);
    return $this;
}
/**
 * Get given url.
 *
 * @return string|null The value last passed to setGivenUrl(); null while the
 *                     property has not been set (the mapped column is nullable)
 */
public function getGivenUrl()
{
    return $this->givenUrl;
}
/** /**
* @return string * @return string
*/ */

View file

@ -78,6 +78,8 @@ class ContentProxy
$entry->setUrl($url); $entry->setUrl($url);
} }
$entry->setGivenUrl($url);
$this->stockEntry($entry, $content); $this->stockEntry($entry, $content);
} }

View file

@ -366,6 +366,7 @@ class EntryRepository extends EntityRepository
*/ */
public function findByHashedUrlAndUserId($hashedUrl, $userId) public function findByHashedUrlAndUserId($hashedUrl, $userId)
{ {
// try first using hashed_url (to use the database index)
$res = $this->createQueryBuilder('e') $res = $this->createQueryBuilder('e')
->where('e.hashedUrl = :hashed_url')->setParameter('hashed_url', $hashedUrl) ->where('e.hashedUrl = :hashed_url')->setParameter('hashed_url', $hashedUrl)
->andWhere('e.user = :user_id')->setParameter('user_id', $userId) ->andWhere('e.user = :user_id')->setParameter('user_id', $userId)
@ -376,6 +377,17 @@ class EntryRepository extends EntityRepository
return current($res); return current($res);
} }
// then try using hashed_given_url (to use the database index)
$res = $this->createQueryBuilder('e')
->where('e.hashedGivenUrl = :hashed_given_url')->setParameter('hashed_given_url', $hashedUrl)
->andWhere('e.user = :user_id')->setParameter('user_id', $userId)
->getQuery()
->getResult();
if (\count($res)) {
return current($res);
}
return false; return false;
} }

View file

@ -166,7 +166,6 @@ class EntryControllerTest extends WallabagCoreTestCase
$this->assertSame($this->url, $content->getUrl()); $this->assertSame($this->url, $content->getUrl());
$this->assertContains('Google', $content->getTitle()); $this->assertContains('Google', $content->getTitle());
$this->assertSame('fr', $content->getLanguage()); $this->assertSame('fr', $content->getLanguage());
$this->assertSame('2015-03-28 11:43:19', $content->getPublishedAt()->format('Y-m-d H:i:s'));
$this->assertArrayHasKey('x-frame-options', $content->getHeaders()); $this->assertArrayHasKey('x-frame-options', $content->getHeaders());
$client->getContainer()->get('craue_config')->set('store_article_headers', 0); $client->getContainer()->get('craue_config')->set('store_article_headers', 0);
} }
@ -266,6 +265,44 @@ class EntryControllerTest extends WallabagCoreTestCase
$this->assertContains('/view/', $client->getResponse()->getTargetUrl()); $this->assertContains('/view/', $client->getResponse()->getTargetUrl());
} }
/**
 * Submits the same redirecting url twice through the "new entry" form.
 *
 * The response to the second submission is expected to be a 302 whose
 * target contains `/view/`.
 *
 * This test will require an internet connection.
 */
public function testPostNewOkUrlExistWithRedirection()
{
    $this->logInAs('admin');
    $client = $this->getClient();

    $redirectingUrl = 'https://wllbg.org/test-redirect/c51c';

    // Same request / check / submit sequence for both submissions; only the
    // response to the last one is inspected below.
    for ($attempt = 1; $attempt <= 2; ++$attempt) {
        $newEntryPage = $client->request('GET', '/new');
        $this->assertSame(200, $client->getResponse()->getStatusCode());

        $entryForm = $newEntryPage->filter('form[name=entry]')->form();
        $client->submit($entryForm, ['entry[url]' => $redirectingUrl]);
    }

    $this->assertSame(302, $client->getResponse()->getStatusCode());
    $this->assertContains('/view/', $client->getResponse()->getTargetUrl());
}
/** /**
* This test will require an internet connection. * This test will require an internet connection.
*/ */