]> git.immae.eu Git - github/wallabag/wallabag.git/blame - tests/Wallabag/CoreBundle/Helper/ContentProxyTest.php
Put default fetching error title in global config
[github/wallabag/wallabag.git] / tests / Wallabag / CoreBundle / Helper / ContentProxyTest.php
CommitLineData
558d9aab
JB
1<?php
2
a2c1b94e 3namespace Tests\Wallabag\CoreBundle\Helper;
558d9aab 4
0c5bcd82 5use Psr\Log\NullLogger;
558d9aab 6use Wallabag\CoreBundle\Helper\ContentProxy;
c2656f96
JB
7use Wallabag\CoreBundle\Entity\Entry;
8use Wallabag\CoreBundle\Entity\Tag;
619cc453 9use Wallabag\UserBundle\Entity\User;
6bc6fb1f 10use Wallabag\CoreBundle\Helper\RuleBasedTagger;
74a75f7d 11use Graby\Graby;
f0378b4d
JB
12use Monolog\Handler\TestHandler;
13use Monolog\Logger;
558d9aab 14
a2c1b94e 15class ContentProxyTest extends \PHPUnit_Framework_TestCase
558d9aab 16{
ac1509a6 17 private $fetchingErrorMessage = 'wallabag can\'t retrieve contents for this article. Please <a href="http://doc.wallabag.org/en/user/errors_during_fetching.html#how-can-i-help-to-fix-that">troubleshoot this issue</a>.';
a2c1b94e 18
4d0ec0e7
JB
19 public function testWithBadUrl()
20 {
21 $tagger = $this->getTaggerMock();
22 $tagger->expects($this->once())
23 ->method('tag');
24
25 $graby = $this->getMockBuilder('Graby\Graby')
4094ea47 26 ->setMethods(['fetchContent'])
4d0ec0e7
JB
27 ->disableOriginalConstructor()
28 ->getMock();
29
30 $graby->expects($this->any())
31 ->method('fetchContent')
4094ea47 32 ->willReturn([
4d0ec0e7
JB
33 'html' => false,
34 'title' => '',
35 'url' => '',
36 'content_type' => '',
37 'language' => '',
4094ea47 38 ]);
4d0ec0e7 39
6bc6fb1f 40 $proxy = new ContentProxy($graby, $tagger, $this->getLogger(), $this->fetchingErrorMessage);
7aba665e
JC
41 $entry = new Entry(new User());
42 $proxy->updateEntry($entry, 'http://user@:80');
4d0ec0e7
JB
43
44 $this->assertEquals('http://user@:80', $entry->getUrl());
45 $this->assertEmpty($entry->getTitle());
fc2b7bda 46 $this->assertEquals($this->fetchingErrorMessage, $entry->getContent());
4d0ec0e7
JB
47 $this->assertEmpty($entry->getPreviewPicture());
48 $this->assertEmpty($entry->getMimetype());
49 $this->assertEmpty($entry->getLanguage());
50 $this->assertEquals(0.0, $entry->getReadingTime());
51 $this->assertEquals(false, $entry->getDomainName());
52 }
53
558d9aab
JB
54 public function testWithEmptyContent()
55 {
f530f7f5
KG
56 $tagger = $this->getTaggerMock();
57 $tagger->expects($this->once())
58 ->method('tag');
59
558d9aab 60 $graby = $this->getMockBuilder('Graby\Graby')
4094ea47 61 ->setMethods(['fetchContent'])
558d9aab
JB
62 ->disableOriginalConstructor()
63 ->getMock();
64
65 $graby->expects($this->any())
66 ->method('fetchContent')
4094ea47 67 ->willReturn([
98f0929f
JB
68 'html' => false,
69 'title' => '',
70 'url' => '',
71 'content_type' => '',
72 'language' => '',
4094ea47 73 ]);
558d9aab 74
6bc6fb1f 75 $proxy = new ContentProxy($graby, $tagger, $this->getLogger(), $this->fetchingErrorMessage);
7aba665e
JC
76 $entry = new Entry(new User());
77 $proxy->updateEntry($entry, 'http://0.0.0.0');
558d9aab
JB
78
79 $this->assertEquals('http://0.0.0.0', $entry->getUrl());
80 $this->assertEmpty($entry->getTitle());
fc2b7bda 81 $this->assertEquals($this->fetchingErrorMessage, $entry->getContent());
558d9aab
JB
82 $this->assertEmpty($entry->getPreviewPicture());
83 $this->assertEmpty($entry->getMimetype());
98f0929f 84 $this->assertEmpty($entry->getLanguage());
da3d4998
JB
85 $this->assertEquals(0.0, $entry->getReadingTime());
86 $this->assertEquals('0.0.0.0', $entry->getDomainName());
558d9aab
JB
87 }
88
89 public function testWithEmptyContentButOG()
90 {
f530f7f5
KG
91 $tagger = $this->getTaggerMock();
92 $tagger->expects($this->once())
93 ->method('tag');
94
558d9aab 95 $graby = $this->getMockBuilder('Graby\Graby')
4094ea47 96 ->setMethods(['fetchContent'])
558d9aab
JB
97 ->disableOriginalConstructor()
98 ->getMock();
99
100 $graby->expects($this->any())
101 ->method('fetchContent')
4094ea47 102 ->willReturn([
98f0929f
JB
103 'html' => false,
104 'title' => '',
105 'url' => '',
106 'content_type' => '',
107 'language' => '',
10b35097 108 'status' => '',
4094ea47 109 'open_graph' => [
98f0929f
JB
110 'og_title' => 'my title',
111 'og_description' => 'desc',
4094ea47
JB
112 ],
113 ]);
558d9aab 114
6bc6fb1f 115 $proxy = new ContentProxy($graby, $tagger, $this->getLogger(), $this->fetchingErrorMessage);
7aba665e
JC
116 $entry = new Entry(new User());
117 $proxy->updateEntry($entry, 'http://domain.io');
558d9aab 118
da3d4998 119 $this->assertEquals('http://domain.io', $entry->getUrl());
558d9aab 120 $this->assertEquals('my title', $entry->getTitle());
d09fe4d2 121 $this->assertEquals($this->fetchingErrorMessage.'<p><i>But we found a short description: </i></p>desc', $entry->getContent());
558d9aab 122 $this->assertEmpty($entry->getPreviewPicture());
98f0929f 123 $this->assertEmpty($entry->getLanguage());
10b35097 124 $this->assertEmpty($entry->getHttpStatus());
558d9aab 125 $this->assertEmpty($entry->getMimetype());
da3d4998
JB
126 $this->assertEquals(0.0, $entry->getReadingTime());
127 $this->assertEquals('domain.io', $entry->getDomainName());
558d9aab
JB
128 }
129
130 public function testWithContent()
131 {
f530f7f5
KG
132 $tagger = $this->getTaggerMock();
133 $tagger->expects($this->once())
134 ->method('tag');
135
558d9aab 136 $graby = $this->getMockBuilder('Graby\Graby')
4094ea47 137 ->setMethods(['fetchContent'])
558d9aab
JB
138 ->disableOriginalConstructor()
139 ->getMock();
140
141 $graby->expects($this->any())
142 ->method('fetchContent')
4094ea47 143 ->willReturn([
da3d4998 144 'html' => str_repeat('this is my content', 325),
558d9aab
JB
145 'title' => 'this is my title',
146 'url' => 'http://1.1.1.1',
147 'content_type' => 'text/html',
98f0929f 148 'language' => 'fr',
10b35097 149 'status' => '200',
4094ea47 150 'open_graph' => [
558d9aab
JB
151 'og_title' => 'my OG title',
152 'og_description' => 'OG desc',
f1e29e69 153 'og_image' => 'http://3.3.3.3/cover.jpg',
4094ea47
JB
154 ],
155 ]);
558d9aab 156
6bc6fb1f 157 $proxy = new ContentProxy($graby, $tagger, $this->getLogger(), $this->fetchingErrorMessage);
7aba665e
JC
158 $entry = new Entry(new User());
159 $proxy->updateEntry($entry, 'http://0.0.0.0');
558d9aab
JB
160
161 $this->assertEquals('http://1.1.1.1', $entry->getUrl());
162 $this->assertEquals('this is my title', $entry->getTitle());
da3d4998 163 $this->assertContains('this is my content', $entry->getContent());
558d9aab
JB
164 $this->assertEquals('http://3.3.3.3/cover.jpg', $entry->getPreviewPicture());
165 $this->assertEquals('text/html', $entry->getMimetype());
98f0929f 166 $this->assertEquals('fr', $entry->getLanguage());
10b35097 167 $this->assertEquals('200', $entry->getHttpStatus());
da3d4998
JB
168 $this->assertEquals(4.0, $entry->getReadingTime());
169 $this->assertEquals('1.1.1.1', $entry->getDomainName());
558d9aab 170 }
f530f7f5 171
3d71d403
JB
172 public function testWithContentAndNoOgImage()
173 {
174 $tagger = $this->getTaggerMock();
175 $tagger->expects($this->once())
176 ->method('tag');
177
178 $graby = $this->getMockBuilder('Graby\Graby')
179 ->setMethods(['fetchContent'])
180 ->disableOriginalConstructor()
181 ->getMock();
182
183 $graby->expects($this->any())
184 ->method('fetchContent')
185 ->willReturn([
186 'html' => str_repeat('this is my content', 325),
187 'title' => 'this is my title',
188 'url' => 'http://1.1.1.1',
189 'content_type' => 'text/html',
190 'language' => 'fr',
191 'status' => '200',
192 'open_graph' => [
193 'og_title' => 'my OG title',
194 'og_description' => 'OG desc',
195 'og_image' => false,
196 ],
197 ]);
198
6bc6fb1f 199 $proxy = new ContentProxy($graby, $tagger, $this->getLogger(), $this->fetchingErrorMessage);
3d71d403
JB
200 $entry = $proxy->updateEntry(new Entry(new User()), 'http://0.0.0.0');
201
202 $this->assertEquals('http://1.1.1.1', $entry->getUrl());
203 $this->assertEquals('this is my title', $entry->getTitle());
204 $this->assertContains('this is my content', $entry->getContent());
205 $this->assertNull($entry->getPreviewPicture());
206 $this->assertEquals('text/html', $entry->getMimetype());
207 $this->assertEquals('fr', $entry->getLanguage());
208 $this->assertEquals('200', $entry->getHttpStatus());
209 $this->assertEquals(4.0, $entry->getReadingTime());
210 $this->assertEquals('1.1.1.1', $entry->getDomainName());
211 }
212
4d0ec0e7
JB
213 public function testWithForcedContent()
214 {
215 $tagger = $this->getTaggerMock();
216 $tagger->expects($this->once())
217 ->method('tag');
218
0d6cfb88 219 $proxy = new ContentProxy((new Graby()), $tagger, $this->getLogger(), $this->fetchingErrorMessage);
7aba665e
JC
220 $entry = new Entry(new User());
221 $proxy->updateEntry(
222 $entry,
0d6cfb88
JB
223 'http://0.0.0.0',
224 [
225 'html' => str_repeat('this is my content', 325),
226 'title' => 'this is my title',
227 'url' => 'http://1.1.1.1',
228 'content_type' => 'text/html',
229 'language' => 'fr',
f0378b4d
JB
230 'date' => '1395635872',
231 'authors' => ['Jeremy', 'Nico', 'Thomas'],
232 'all_headers' => [
233 'Cache-Control' => 'no-cache',
38a04dee 234 ],
0d6cfb88
JB
235 ]
236 );
4d0ec0e7
JB
237
238 $this->assertEquals('http://1.1.1.1', $entry->getUrl());
239 $this->assertEquals('this is my title', $entry->getTitle());
240 $this->assertContains('this is my content', $entry->getContent());
241 $this->assertEquals('text/html', $entry->getMimetype());
242 $this->assertEquals('fr', $entry->getLanguage());
243 $this->assertEquals(4.0, $entry->getReadingTime());
244 $this->assertEquals('1.1.1.1', $entry->getDomainName());
f0378b4d
JB
245 $this->assertEquals('24/03/2014', $entry->getPublishedAt()->format('d/m/Y'));
246 $this->assertContains('Jeremy', $entry->getPublishedBy());
247 $this->assertContains('Nico', $entry->getPublishedBy());
248 $this->assertContains('Thomas', $entry->getPublishedBy());
249 $this->assertContains('no-cache', $entry->getHeaders());
250 }
251
252 public function testWithForcedContentAndDatetime()
253 {
254 $tagger = $this->getTaggerMock();
255 $tagger->expects($this->once())
256 ->method('tag');
257
695af588 258 $proxy = new ContentProxy((new Graby()), $tagger, $this->getLogger(), $this->fetchingErrorMessage);
7aba665e
JC
259 $entry = new Entry(new User());
260 $proxy->updateEntry(
261 $entry,
f0378b4d
JB
262 'http://0.0.0.0',
263 [
264 'html' => str_repeat('this is my content', 325),
265 'title' => 'this is my title',
266 'url' => 'http://1.1.1.1',
267 'content_type' => 'text/html',
268 'language' => 'fr',
269 'date' => '2016-09-08T11:55:58+0200',
270 ]
271 );
272
273 $this->assertEquals('http://1.1.1.1', $entry->getUrl());
274 $this->assertEquals('this is my title', $entry->getTitle());
275 $this->assertContains('this is my content', $entry->getContent());
276 $this->assertEquals('text/html', $entry->getMimetype());
277 $this->assertEquals('fr', $entry->getLanguage());
278 $this->assertEquals(4.0, $entry->getReadingTime());
279 $this->assertEquals('1.1.1.1', $entry->getDomainName());
280 $this->assertEquals('08/09/2016', $entry->getPublishedAt()->format('d/m/Y'));
281 }
282
283 public function testWithForcedContentAndBadDate()
284 {
285 $tagger = $this->getTaggerMock();
286 $tagger->expects($this->once())
287 ->method('tag');
288
289 $logger = new Logger('foo');
290 $handler = new TestHandler();
291 $logger->pushHandler($handler);
292
695af588 293 $proxy = new ContentProxy((new Graby()), $tagger, $logger, $this->fetchingErrorMessage);
7aba665e
JC
294 $entry = new Entry(new User());
295 $proxy->updateEntry(
296 $entry,
f0378b4d
JB
297 'http://0.0.0.0',
298 [
299 'html' => str_repeat('this is my content', 325),
300 'title' => 'this is my title',
301 'url' => 'http://1.1.1.1',
302 'content_type' => 'text/html',
303 'language' => 'fr',
304 'date' => '01 02 2012',
305 ]
306 );
307
308 $this->assertEquals('http://1.1.1.1', $entry->getUrl());
309 $this->assertEquals('this is my title', $entry->getTitle());
310 $this->assertContains('this is my content', $entry->getContent());
311 $this->assertEquals('text/html', $entry->getMimetype());
312 $this->assertEquals('fr', $entry->getLanguage());
313 $this->assertEquals(4.0, $entry->getReadingTime());
314 $this->assertEquals('1.1.1.1', $entry->getDomainName());
315 $this->assertNull($entry->getPublishedAt());
316
317 $records = $handler->getRecords();
318
319 $this->assertCount(1, $records);
320 $this->assertContains('Error while defining date', $records[0]['message']);
4d0ec0e7
JB
321 }
322
323 public function testTaggerThrowException()
324 {
325 $graby = $this->getMockBuilder('Graby\Graby')
326 ->disableOriginalConstructor()
327 ->getMock();
328
329 $tagger = $this->getTaggerMock();
330 $tagger->expects($this->once())
331 ->method('tag')
332 ->will($this->throwException(new \Exception()));
333
6bc6fb1f 334 $proxy = new ContentProxy($graby, $tagger, $this->getLogger(), $this->fetchingErrorMessage);
4d0ec0e7 335
7aba665e
JC
336 $entry = new Entry(new User());
337 $proxy->updateEntry($entry, 'http://0.0.0.0', [
4d0ec0e7
JB
338 'html' => str_repeat('this is my content', 325),
339 'title' => 'this is my title',
340 'url' => 'http://1.1.1.1',
341 'content_type' => 'text/html',
342 'language' => 'fr',
343 ]);
344
345 $this->assertCount(0, $entry->getTags());
346 }
347
74a75f7d
JB
348 public function dataForCrazyHtml()
349 {
350 return [
351 'script and comment' => [
352 '<strong>Script inside:</strong> <!--[if gte IE 4]><script>alert(\'lol\');</script><![endif]--><br />',
38a04dee 353 'lol',
74a75f7d
JB
354 ],
355 'script' => [
356 '<strong>Script inside:</strong><script>alert(\'lol\');</script>',
38a04dee 357 'script',
74a75f7d
JB
358 ],
359 ];
360 }
361
362 /**
363 * @dataProvider dataForCrazyHtml
364 */
365 public function testWithCrazyHtmlContent($html, $escapedString)
366 {
367 $tagger = $this->getTaggerMock();
368 $tagger->expects($this->once())
369 ->method('tag');
370
0d6cfb88 371 $proxy = new ContentProxy((new Graby()), $tagger, $this->getLogger(), $this->fetchingErrorMessage);
74a75f7d
JB
372 $entry = $proxy->updateEntry(
373 new Entry(new User()),
374 'http://1.1.1.1',
375 [
376 'html' => $html,
377 'title' => 'this is my title',
378 'url' => 'http://1.1.1.1',
379 'content_type' => 'text/html',
380 'language' => 'fr',
381 'status' => '200',
382 'open_graph' => [
383 'og_title' => 'my OG title',
384 'og_description' => 'OG desc',
385 'og_image' => 'http://3.3.3.3/cover.jpg',
386 ],
387 ]
388 );
389
390 $this->assertEquals('http://1.1.1.1', $entry->getUrl());
391 $this->assertEquals('this is my title', $entry->getTitle());
392 $this->assertNotContains($escapedString, $entry->getContent());
393 $this->assertEquals('http://3.3.3.3/cover.jpg', $entry->getPreviewPicture());
394 $this->assertEquals('text/html', $entry->getMimetype());
395 $this->assertEquals('fr', $entry->getLanguage());
396 $this->assertEquals('200', $entry->getHttpStatus());
397 $this->assertEquals('1.1.1.1', $entry->getDomainName());
398 }
399
f530f7f5
KG
400 private function getTaggerMock()
401 {
6bc6fb1f 402 return $this->getMockBuilder(RuleBasedTagger::class)
4094ea47 403 ->setMethods(['tag'])
f530f7f5
KG
404 ->disableOriginalConstructor()
405 ->getMock();
406 }
1c9cd2a7 407
0c5bcd82 408 private function getLogger()
1c9cd2a7 409 {
0c5bcd82 410 return new NullLogger();
1c9cd2a7 411 }
558d9aab 412}