mirror of
https://github.com/wallabag/wallabag.git
synced 2025-04-29 05:04:42 +00:00
We got some imports with a missing `url` field generating some errors while trying to retrieve an existing entry with that url. Introducing the `validateEntry` allow us to dismiss a message when it doesn't have an url (or other missing stuff in the future)
236 lines
5.9 KiB
PHP
236 lines
5.9 KiB
PHP
<?php
|
|
|
|
namespace Wallabag\ImportBundle\Import;
|
|
|
|
use Wallabag\CoreBundle\Entity\Entry;
|
|
use Wallabag\CoreBundle\Event\EntrySavedEvent;
|
|
|
|
abstract class BrowserImport extends AbstractImport
|
|
{
|
|
protected $filepath;
|
|
|
|
/**
|
|
* {@inheritdoc}
|
|
*/
|
|
abstract public function getName();
|
|
|
|
/**
|
|
* {@inheritdoc}
|
|
*/
|
|
abstract public function getUrl();
|
|
|
|
/**
|
|
* {@inheritdoc}
|
|
*/
|
|
abstract public function getDescription();
|
|
|
|
/**
|
|
* {@inheritdoc}
|
|
*/
|
|
public function import()
|
|
{
|
|
if (!$this->user) {
|
|
$this->logger->error('Wallabag Browser Import: user is not defined');
|
|
|
|
return false;
|
|
}
|
|
|
|
if (!file_exists($this->filepath) || !is_readable($this->filepath)) {
|
|
$this->logger->error('Wallabag Browser Import: unable to read file', ['filepath' => $this->filepath]);
|
|
|
|
return false;
|
|
}
|
|
|
|
$data = json_decode(file_get_contents($this->filepath), true);
|
|
|
|
if (empty($data)) {
|
|
$this->logger->error('Wallabag Browser: no entries in imported file');
|
|
|
|
return false;
|
|
}
|
|
|
|
if ($this->producer) {
|
|
$this->parseEntriesForProducer($data);
|
|
|
|
return true;
|
|
}
|
|
|
|
$this->parseEntries($data);
|
|
|
|
return true;
|
|
}
|
|
|
|
/**
|
|
* Set file path to the json file.
|
|
*
|
|
* @param string $filepath
|
|
*/
|
|
public function setFilepath($filepath)
|
|
{
|
|
$this->filepath = $filepath;
|
|
|
|
return $this;
|
|
}
|
|
|
|
/**
|
|
* {@inheritdoc}
|
|
*/
|
|
public function parseEntry(array $importedEntry)
|
|
{
|
|
if ((!array_key_exists('guid', $importedEntry) || (!array_key_exists('id', $importedEntry))) && \is_array(reset($importedEntry))) {
|
|
if ($this->producer) {
|
|
$this->parseEntriesForProducer($importedEntry);
|
|
|
|
return;
|
|
}
|
|
|
|
$this->parseEntries($importedEntry);
|
|
|
|
return;
|
|
}
|
|
|
|
if (array_key_exists('children', $importedEntry)) {
|
|
if ($this->producer) {
|
|
$this->parseEntriesForProducer($importedEntry['children']);
|
|
|
|
return;
|
|
}
|
|
|
|
$this->parseEntries($importedEntry['children']);
|
|
|
|
return;
|
|
}
|
|
|
|
if (!array_key_exists('uri', $importedEntry) && !array_key_exists('url', $importedEntry)) {
|
|
return;
|
|
}
|
|
|
|
$url = array_key_exists('uri', $importedEntry) ? $importedEntry['uri'] : $importedEntry['url'];
|
|
|
|
$existingEntry = $this->em
|
|
->getRepository('WallabagCoreBundle:Entry')
|
|
->findByUrlAndUserId($url, $this->user->getId());
|
|
|
|
if (false !== $existingEntry) {
|
|
++$this->skippedEntries;
|
|
|
|
return;
|
|
}
|
|
|
|
$data = $this->prepareEntry($importedEntry);
|
|
|
|
$entry = new Entry($this->user);
|
|
$entry->setUrl($data['url']);
|
|
$entry->setTitle($data['title']);
|
|
|
|
// update entry with content (in case fetching failed, the given entry will be return)
|
|
$this->fetchContent($entry, $data['url'], $data);
|
|
|
|
if (array_key_exists('tags', $data)) {
|
|
$this->tagsAssigner->assignTagsToEntry(
|
|
$entry,
|
|
$data['tags']
|
|
);
|
|
}
|
|
|
|
$entry->setArchived($data['is_archived']);
|
|
|
|
if (!empty($data['created_at'])) {
|
|
$dt = new \DateTime();
|
|
$entry->setCreatedAt($dt->setTimestamp($data['created_at']));
|
|
}
|
|
|
|
$this->em->persist($entry);
|
|
++$this->importedEntries;
|
|
|
|
return $entry;
|
|
}
|
|
|
|
/**
|
|
* Parse and insert all given entries.
|
|
*
|
|
* @param array $entries
|
|
*/
|
|
protected function parseEntries(array $entries)
|
|
{
|
|
$i = 1;
|
|
$entryToBeFlushed = [];
|
|
|
|
foreach ($entries as $importedEntry) {
|
|
if ((array) $importedEntry !== $importedEntry) {
|
|
continue;
|
|
}
|
|
|
|
$entry = $this->parseEntry($importedEntry);
|
|
|
|
if (null === $entry) {
|
|
continue;
|
|
}
|
|
|
|
// @see AbstractImport
|
|
$entryToBeFlushed[] = $entry;
|
|
|
|
// flush every 20 entries
|
|
if (0 === ($i % 20)) {
|
|
$this->em->flush();
|
|
|
|
foreach ($entryToBeFlushed as $entry) {
|
|
$this->eventDispatcher->dispatch(EntrySavedEvent::NAME, new EntrySavedEvent($entry));
|
|
}
|
|
|
|
$entryToBeFlushed = [];
|
|
}
|
|
++$i;
|
|
}
|
|
|
|
$this->em->flush();
|
|
|
|
if (!empty($entryToBeFlushed)) {
|
|
foreach ($entryToBeFlushed as $entry) {
|
|
$this->eventDispatcher->dispatch(EntrySavedEvent::NAME, new EntrySavedEvent($entry));
|
|
}
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Parse entries and send them to the queue.
|
|
* It should just be a simple loop on all item, no call to the database should be done
|
|
* to speedup queuing.
|
|
*
|
|
* Faster parse entries for Producer.
|
|
* We don't care to make check at this time. They'll be done by the consumer.
|
|
*
|
|
* @param array $entries
|
|
*/
|
|
protected function parseEntriesForProducer(array $entries)
|
|
{
|
|
foreach ($entries as $importedEntry) {
|
|
if ((array) $importedEntry !== $importedEntry) {
|
|
continue;
|
|
}
|
|
|
|
// set userId for the producer (it won't know which user is connected)
|
|
$importedEntry['userId'] = $this->user->getId();
|
|
|
|
if ($this->markAsRead) {
|
|
$importedEntry = $this->setEntryAsRead($importedEntry);
|
|
}
|
|
|
|
++$this->queuedEntries;
|
|
|
|
$this->producer->publish(json_encode($importedEntry));
|
|
}
|
|
}
|
|
|
|
/**
|
|
* {@inheritdoc}
|
|
*/
|
|
protected function setEntryAsRead(array $importedEntry)
|
|
{
|
|
$importedEntry['is_archived'] = 1;
|
|
|
|
return $importedEntry;
|
|
}
|
|
|
|
abstract protected function prepareEntry(array $entry = []);
|
|
}
|