]>
Commit | Line | Data |
---|---|---|
19d9efab JB |
1 | <?php |
2 | ||
3 | namespace Wallabag\ImportBundle\Import; | |
4 | ||
5 | use Psr\Log\LoggerInterface; | |
6 | use Psr\Log\NullLogger; | |
7 | use Doctrine\ORM\EntityManager; | |
8 | use Wallabag\CoreBundle\Helper\ContentProxy; | |
9 | use Wallabag\CoreBundle\Entity\Entry; | |
8664069e | 10 | use Wallabag\CoreBundle\Entity\Tag; |
3849a9f3 | 11 | use Wallabag\UserBundle\Entity\User; |
b3437d58 | 12 | use OldSound\RabbitMqBundle\RabbitMq\ProducerInterface; |
19d9efab JB |
13 | |
/**
 * Common base for the importers.
 *
 * Holds the shared collaborators (entity manager, content proxy, logger and
 * an optional queue producer), the current user, the "mark as read" flag and
 * the import counters. It provides two loops over raw entries: one that parses
 * them and flushes the entity manager in batches (parseEntries) and one that
 * only publishes them to a queue (parseEntriesForProducer).
 */
abstract class AbstractImport implements ImportInterface
{
    /** @var EntityManager */
    protected $em;

    /** @var LoggerInterface Defaults to a NullLogger until setLogger() is called */
    protected $logger;

    /** @var ContentProxy */
    protected $contentProxy;

    /** @var ProducerInterface|null Only set once setProducer() has been called */
    protected $producer;

    /** @var User|null Only set once setUser() has been called */
    protected $user;

    /** @var bool|null Only set once setMarkAsRead() has been called */
    protected $markAsRead;

    /** @var int Not modified in this class; presumably maintained by the concrete importers */
    protected $skippedEntries = 0;

    /** @var int Not modified in this class; presumably maintained by the concrete importers */
    protected $importedEntries = 0;

    /** @var int Number of entries published by parseEntriesForProducer() */
    protected $queuedEntries = 0;

    /**
     * @param EntityManager $em
     * @param ContentProxy  $contentProxy
     */
    public function __construct(EntityManager $em, ContentProxy $contentProxy)
    {
        $this->em = $em;
        $this->logger = new NullLogger();
        $this->contentProxy = $contentProxy;
    }

    /**
     * Replace the default NullLogger with a real logger.
     *
     * @param LoggerInterface $logger
     */
    public function setLogger(LoggerInterface $logger)
    {
        $this->logger = $logger;
    }

    /**
     * Set RabbitMQ/Redis Producer to send each entry to a queue.
     * This method should be called when the user has enabled RabbitMQ.
     *
     * @param ProducerInterface $producer
     */
    public function setProducer(ProducerInterface $producer)
    {
        $this->producer = $producer;
    }

    /**
     * Set current user.
     * Could be the current *connected* user or one retrieved by the consumer.
     *
     * @param User $user
     */
    public function setUser(User $user)
    {
        $this->user = $user;
    }

    /**
     * Set whether articles must be all marked as read.
     *
     * @param bool $markAsRead
     *
     * @return $this
     */
    public function setMarkAsRead($markAsRead)
    {
        $this->markAsRead = $markAsRead;

        return $this;
    }

    /**
     * Get whether articles must be all marked as read.
     *
     * @return bool|null null as long as setMarkAsRead() has not been called
     */
    public function getMarkAsRead()
    {
        return $this->markAsRead;
    }

    /**
     * Fetch content from the ContentProxy (using graby).
     * If it fails, the error is logged and false is returned instead of the updated entry.
     *
     * @param Entry  $entry   Entry to update
     * @param string $url     Url to grab content for
     * @param array  $content An array with AT LEAST keys title, html, url, language & content_type to skip the fetchContent from the url
     *
     * @return Entry|false
     */
    protected function fetchContent(Entry $entry, $url, array $content = [])
    {
        try {
            return $this->contentProxy->updateEntry($entry, $url, $content);
        } catch (\Exception $e) {
            // Best effort: one failing entry must not abort the whole import,
            // but the failure is logged so it can be diagnosed afterwards.
            $this->logger->error('Error trying to import an entry.', [
                'entry_url' => $url,
                'error_msg' => $e->getMessage(),
                'exception' => $e,
            ]);

            return false;
        }
    }

    /**
     * Parse all given entries and flush the entity manager in batches.
     *
     * @param array|\Traversable $entries Raw entries; each item is handed to parseEntry()
     */
    protected function parseEntries($entries)
    {
        $parsedCount = 0;

        foreach ($entries as $importedEntry) {
            $entry = $this->parseEntry($importedEntry);

            // parseEntry() returned nothing for this item: it does not count toward the batch
            if (null === $entry) {
                continue;
            }

            ++$parsedCount;

            // flush every 20 entries
            if (0 === $parsedCount % 20) {
                $this->em->flush();

                // clear only affected entities
                $this->em->clear(Entry::class);
                $this->em->clear(Tag::class);
            }
        }

        // flush whatever remains from the last, incomplete batch
        $this->em->flush();
    }

    /**
     * Parse entries and send them to the queue.
     * It should just be a simple loop on all items; no call to the database should be done
     * to speed up queuing.
     *
     * Faster parse entries for Producer.
     * We don't care about making checks at this time. They'll be done by the consumer.
     *
     * Requires setUser() and setProducer() to have been called beforehand.
     *
     * @param array $entries
     */
    protected function parseEntriesForProducer(array $entries)
    {
        foreach ($entries as $importedEntry) {
            // set userId for the producer (it won't know which user is connected)
            $importedEntry['userId'] = $this->user->getId();

            if ($this->markAsRead) {
                $importedEntry = $this->setEntryAsRead($importedEntry);
            }

            $this->producer->publish(json_encode($importedEntry));

            // count the entry only once it has actually been handed to the producer
            ++$this->queuedEntries;
        }
    }

    /**
     * {@inheritdoc}
     */
    public function getSummary()
    {
        return [
            'skipped' => $this->skippedEntries,
            'imported' => $this->importedEntries,
            'queued' => $this->queuedEntries,
        ];
    }

    /**
     * Parse one entry.
     *
     * @param array $importedEntry
     *
     * @return Entry|null null when there is no entry to take into account (parseEntries() then skips it)
     */
    abstract public function parseEntry(array $importedEntry);

    /**
     * Set current imported entry to archived / read.
     * Implementation is different across all imports.
     *
     * @param array $importedEntry
     *
     * @return array
     */
    abstract protected function setEntryAsRead(array $importedEntry);
}