3 namespace Tests\Wallabag\CoreBundle\Helper
;
6 use Monolog\Handler\TestHandler
;
8 use Psr\Log\NullLogger
;
9 use Symfony\Component\Validator\ConstraintViolation
;
10 use Symfony\Component\Validator\ConstraintViolationList
;
11 use Symfony\Component\Validator\Validator\RecursiveValidator
;
12 use Wallabag\CoreBundle\Entity\Entry
;
13 use Wallabag\CoreBundle\Entity\Tag
;
14 use Wallabag\CoreBundle\Helper\ContentProxy
;
15 use Wallabag\CoreBundle\Helper\RuleBasedTagger
;
16 use Wallabag\UserBundle\Entity\User
;
18 class ContentProxyTest
extends \PHPUnit_Framework_TestCase
20 private $fetchingErrorMessage = 'wallabag can\'t retrieve contents for this article. Please <a href="http://doc.wallabag.org/en/user/errors_during_fetching.html#how-can-i-help-to-fix-that">troubleshoot this issue</a>.';
22 public function testWithBadUrl()
24 $tagger = $this->getTaggerMock();
25 $tagger->expects($this->once())
28 $graby = $this->getMockBuilder('Graby\Graby')
29 ->setMethods(['fetchContent'])
30 ->disableOriginalConstructor()
33 $graby->expects($this->any())
34 ->method('fetchContent')
43 $proxy = new ContentProxy($graby, $tagger, $this->getValidator(), $this->getLogger(), $this->fetchingErrorMessage
);
44 $entry = new Entry(new User());
45 $proxy->updateEntry($entry, 'http://user@:80');
47 $this->assertSame('http://user@:80', $entry->getUrl());
48 $this->assertEmpty($entry->getTitle());
49 $this->assertSame($this->fetchingErrorMessage
, $entry->getContent());
50 $this->assertEmpty($entry->getPreviewPicture());
51 $this->assertEmpty($entry->getMimetype());
52 $this->assertEmpty($entry->getLanguage());
53 $this->assertSame(0.0, $entry->getReadingTime());
54 $this->assertNull($entry->getDomainName());
57 public function testWithEmptyContent()
59 $tagger = $this->getTaggerMock();
60 $tagger->expects($this->once())
63 $graby = $this->getMockBuilder('Graby\Graby')
64 ->setMethods(['fetchContent'])
65 ->disableOriginalConstructor()
68 $graby->expects($this->any())
69 ->method('fetchContent')
78 $proxy = new ContentProxy($graby, $tagger, $this->getValidator(), $this->getLogger(), $this->fetchingErrorMessage
);
79 $entry = new Entry(new User());
80 $proxy->updateEntry($entry, 'http://0.0.0.0');
82 $this->assertSame('http://0.0.0.0', $entry->getUrl());
83 $this->assertEmpty($entry->getTitle());
84 $this->assertSame($this->fetchingErrorMessage
, $entry->getContent());
85 $this->assertEmpty($entry->getPreviewPicture());
86 $this->assertEmpty($entry->getMimetype());
87 $this->assertEmpty($entry->getLanguage());
88 $this->assertSame(0.0, $entry->getReadingTime());
89 $this->assertSame('0.0.0.0', $entry->getDomainName());
92 public function testWithEmptyContentButOG()
94 $tagger = $this->getTaggerMock();
95 $tagger->expects($this->once())
98 $graby = $this->getMockBuilder('Graby\Graby')
99 ->setMethods(['fetchContent'])
100 ->disableOriginalConstructor()
103 $graby->expects($this->any())
104 ->method('fetchContent')
109 'content_type' => '',
113 'og_title' => 'my title',
114 'og_description' => 'desc',
118 $proxy = new ContentProxy($graby, $tagger, $this->getValidator(), $this->getLogger(), $this->fetchingErrorMessage
);
119 $entry = new Entry(new User());
120 $proxy->updateEntry($entry, 'http://domain.io');
122 $this->assertSame('http://domain.io', $entry->getUrl());
123 $this->assertSame('my title', $entry->getTitle());
124 $this->assertSame($this->fetchingErrorMessage
. '<p><i>But we found a short description: </i></p>desc', $entry->getContent());
125 $this->assertEmpty($entry->getPreviewPicture());
126 $this->assertEmpty($entry->getLanguage());
127 $this->assertEmpty($entry->getHttpStatus());
128 $this->assertEmpty($entry->getMimetype());
129 $this->assertSame(0.0, $entry->getReadingTime());
130 $this->assertSame('domain.io', $entry->getDomainName());
133 public function testWithContent()
135 $tagger = $this->getTaggerMock();
136 $tagger->expects($this->once())
139 $graby = $this->getMockBuilder('Graby\Graby')
140 ->setMethods(['fetchContent'])
141 ->disableOriginalConstructor()
144 $graby->expects($this->any())
145 ->method('fetchContent')
147 'html' => str_repeat('this is my content', 325),
148 'title' => 'this is my title',
149 'url' => 'http://1.1.1.1',
150 'content_type' => 'text/html',
154 'og_title' => 'my OG title',
155 'og_description' => 'OG desc',
156 'og_image' => 'http://3.3.3.3/cover.jpg',
160 $proxy = new ContentProxy($graby, $tagger, $this->getValidator(), $this->getLogger(), $this->fetchingErrorMessage
);
161 $entry = new Entry(new User());
162 $proxy->updateEntry($entry, 'http://0.0.0.0');
164 $this->assertSame('http://1.1.1.1', $entry->getUrl());
165 $this->assertSame('this is my title', $entry->getTitle());
166 $this->assertContains('this is my content', $entry->getContent());
167 $this->assertSame('http://3.3.3.3/cover.jpg', $entry->getPreviewPicture());
168 $this->assertSame('text/html', $entry->getMimetype());
169 $this->assertSame('fr', $entry->getLanguage());
170 $this->assertSame('200', $entry->getHttpStatus());
171 $this->assertSame(4.0, $entry->getReadingTime());
172 $this->assertSame('1.1.1.1', $entry->getDomainName());
175 public function testWithContentAndNoOgImage()
177 $tagger = $this->getTaggerMock();
178 $tagger->expects($this->once())
181 $graby = $this->getMockBuilder('Graby\Graby')
182 ->setMethods(['fetchContent'])
183 ->disableOriginalConstructor()
186 $graby->expects($this->any())
187 ->method('fetchContent')
189 'html' => str_repeat('this is my content', 325),
190 'title' => 'this is my title',
191 'url' => 'http://1.1.1.1',
192 'content_type' => 'text/html',
196 'og_title' => 'my OG title',
197 'og_description' => 'OG desc',
202 $proxy = new ContentProxy($graby, $tagger, $this->getValidator(), $this->getLogger(), $this->fetchingErrorMessage
);
203 $entry = new Entry(new User());
204 $proxy->updateEntry($entry, 'http://0.0.0.0');
206 $this->assertSame('http://1.1.1.1', $entry->getUrl());
207 $this->assertSame('this is my title', $entry->getTitle());
208 $this->assertContains('this is my content', $entry->getContent());
209 $this->assertNull($entry->getPreviewPicture());
210 $this->assertSame('text/html', $entry->getMimetype());
211 $this->assertSame('fr', $entry->getLanguage());
212 $this->assertSame('200', $entry->getHttpStatus());
213 $this->assertSame(4.0, $entry->getReadingTime());
214 $this->assertSame('1.1.1.1', $entry->getDomainName());
217 public function testWithContentAndBadLanguage()
219 $tagger = $this->getTaggerMock();
220 $tagger->expects($this->once())
223 $validator = $this->getValidator();
224 $validator->expects($this->once())
226 ->willReturn(new ConstraintViolationList([new ConstraintViolation('oops', 'oops', [], 'oops', 'language', 'dontexist')]));
228 $graby = $this->getMockBuilder('Graby\Graby')
229 ->setMethods(['fetchContent'])
230 ->disableOriginalConstructor()
233 $graby->expects($this->any())
234 ->method('fetchContent')
236 'html' => str_repeat('this is my content', 325),
237 'title' => 'this is my title',
238 'url' => 'http://1.1.1.1',
239 'content_type' => 'text/html',
240 'language' => 'dontexist',
244 $proxy = new ContentProxy($graby, $tagger, $validator, $this->getLogger(), $this->fetchingErrorMessage
);
245 $entry = new Entry(new User());
246 $proxy->updateEntry($entry, 'http://0.0.0.0');
248 $this->assertSame('http://1.1.1.1', $entry->getUrl());
249 $this->assertSame('this is my title', $entry->getTitle());
250 $this->assertContains('this is my content', $entry->getContent());
251 $this->assertSame('text/html', $entry->getMimetype());
252 $this->assertNull($entry->getLanguage());
253 $this->assertSame('200', $entry->getHttpStatus());
254 $this->assertSame(4.0, $entry->getReadingTime());
255 $this->assertSame('1.1.1.1', $entry->getDomainName());
258 public function testWithContentAndBadOgImage()
260 $tagger = $this->getTaggerMock();
261 $tagger->expects($this->once())
264 $validator = $this->getValidator();
265 $validator->expects($this->exactly(2))
267 ->will($this->onConsecutiveCalls(
268 new ConstraintViolationList(),
269 new ConstraintViolationList([new ConstraintViolation('oops', 'oops', [], 'oops', 'url', 'https://')])
272 $graby = $this->getMockBuilder('Graby\Graby')
273 ->setMethods(['fetchContent'])
274 ->disableOriginalConstructor()
277 $graby->expects($this->any())
278 ->method('fetchContent')
280 'html' => str_repeat('this is my content', 325),
281 'title' => 'this is my title',
282 'url' => 'http://1.1.1.1',
283 'content_type' => 'text/html',
287 'og_title' => 'my OG title',
288 'og_description' => 'OG desc',
289 'og_image' => 'https://',
293 $proxy = new ContentProxy($graby, $tagger, $validator, $this->getLogger(), $this->fetchingErrorMessage
);
294 $entry = new Entry(new User());
295 $proxy->updateEntry($entry, 'http://0.0.0.0');
297 $this->assertSame('http://1.1.1.1', $entry->getUrl());
298 $this->assertSame('this is my title', $entry->getTitle());
299 $this->assertContains('this is my content', $entry->getContent());
300 $this->assertNull($entry->getPreviewPicture());
301 $this->assertSame('text/html', $entry->getMimetype());
302 $this->assertSame('fr', $entry->getLanguage());
303 $this->assertSame('200', $entry->getHttpStatus());
304 $this->assertSame(4.0, $entry->getReadingTime());
305 $this->assertSame('1.1.1.1', $entry->getDomainName());
308 public function testWithForcedContent()
310 $tagger = $this->getTaggerMock();
311 $tagger->expects($this->once())
314 $proxy = new ContentProxy((new Graby()), $tagger, $this->getValidator(), $this->getLogger(), $this->fetchingErrorMessage
, true);
315 $entry = new Entry(new User());
320 'html' => str_repeat('this is my content', 325),
321 'title' => 'this is my title',
322 'url' => 'http://1.1.1.1',
323 'content_type' => 'text/html',
325 'date' => '1395635872',
326 'authors' => ['Jeremy', 'Nico', 'Thomas'],
328 'Cache-Control' => 'no-cache',
333 $this->assertSame('http://1.1.1.1', $entry->getUrl());
334 $this->assertSame('this is my title', $entry->getTitle());
335 $this->assertContains('this is my content', $entry->getContent());
336 $this->assertSame('text/html', $entry->getMimetype());
337 $this->assertSame('fr', $entry->getLanguage());
338 $this->assertSame(4.0, $entry->getReadingTime());
339 $this->assertSame('1.1.1.1', $entry->getDomainName());
340 $this->assertSame('24/03/2014', $entry->getPublishedAt()->format('d/m/Y'));
341 $this->assertContains('Jeremy', $entry->getPublishedBy());
342 $this->assertContains('Nico', $entry->getPublishedBy());
343 $this->assertContains('Thomas', $entry->getPublishedBy());
344 $this->assertNotNull($entry->getHeaders(), 'Headers are stored, so value is not null');
345 $this->assertContains('no-cache', $entry->getHeaders());
348 public function testWithForcedContentAndDatetime()
350 $tagger = $this->getTaggerMock();
351 $tagger->expects($this->once())
354 $logHandler = new TestHandler();
355 $logger = new Logger('test', [$logHandler]);
357 $proxy = new ContentProxy((new Graby()), $tagger, $this->getValidator(), $logger, $this->fetchingErrorMessage
);
358 $entry = new Entry(new User());
363 'html' => str_repeat('this is my content', 325),
364 'title' => 'this is my title',
365 'url' => 'http://1.1.1.1',
366 'content_type' => 'text/html',
368 'date' => '2016-09-08T11:55:58+0200',
372 $this->assertSame('http://1.1.1.1', $entry->getUrl());
373 $this->assertSame('this is my title', $entry->getTitle());
374 $this->assertContains('this is my content', $entry->getContent());
375 $this->assertSame('text/html', $entry->getMimetype());
376 $this->assertSame('fr', $entry->getLanguage());
377 $this->assertSame(4.0, $entry->getReadingTime());
378 $this->assertSame('1.1.1.1', $entry->getDomainName());
379 $this->assertSame('08/09/2016', $entry->getPublishedAt()->format('d/m/Y'));
382 public function testWithForcedContentAndBadDate()
384 $tagger = $this->getTaggerMock();
385 $tagger->expects($this->once())
388 $logger = new Logger('foo');
389 $handler = new TestHandler();
390 $logger->pushHandler($handler);
392 $proxy = new ContentProxy((new Graby()), $tagger, $this->getValidator(), $logger, $this->fetchingErrorMessage
);
393 $entry = new Entry(new User());
398 'html' => str_repeat('this is my content', 325),
399 'title' => 'this is my title',
400 'url' => 'http://1.1.1.1',
401 'content_type' => 'text/html',
403 'date' => '01 02 2012',
407 $this->assertSame('http://1.1.1.1', $entry->getUrl());
408 $this->assertSame('this is my title', $entry->getTitle());
409 $this->assertContains('this is my content', $entry->getContent());
410 $this->assertSame('text/html', $entry->getMimetype());
411 $this->assertSame('fr', $entry->getLanguage());
412 $this->assertSame(4.0, $entry->getReadingTime());
413 $this->assertSame('1.1.1.1', $entry->getDomainName());
414 $this->assertNull($entry->getPublishedAt());
416 $records = $handler->getRecords();
418 $this->assertCount(1, $records);
419 $this->assertContains('Error while defining date', $records[0]['message']);
422 public function testTaggerThrowException()
424 $tagger = $this->getTaggerMock();
425 $tagger->expects($this->once())
427 ->will($this->throwException(new \
Exception()));
429 $proxy = new ContentProxy((new Graby()), $tagger, $this->getValidator(), $this->getLogger(), $this->fetchingErrorMessage
);
430 $entry = new Entry(new User());
435 'html' => str_repeat('this is my content', 325),
436 'title' => 'this is my title',
437 'url' => 'http://1.1.1.1',
438 'content_type' => 'text/html',
443 $this->assertCount(0, $entry->getTags());
446 public function dataForCrazyHtml()
449 'script and comment' => [
450 '<strong>Script inside:</strong> <!--[if gte IE 4]><script>alert(\'lol\');</script><![endif]--><br />',
454 '<strong>Script inside:</strong><script>alert(\'lol\');</script>',
461 * @dataProvider dataForCrazyHtml
463 public function testWithCrazyHtmlContent($html, $escapedString)
465 $tagger = $this->getTaggerMock();
466 $tagger->expects($this->once())
469 $proxy = new ContentProxy((new Graby()), $tagger, $this->getValidator(), $this->getLogger(), $this->fetchingErrorMessage
);
470 $entry = new Entry(new User());
476 'title' => 'this is my title',
477 'url' => 'http://1.1.1.1',
478 'content_type' => 'text/html',
482 'og_title' => 'my OG title',
483 'og_description' => 'OG desc',
484 'og_image' => 'http://3.3.3.3/cover.jpg',
489 $this->assertSame('http://1.1.1.1', $entry->getUrl());
490 $this->assertSame('this is my title', $entry->getTitle());
491 $this->assertNotContains($escapedString, $entry->getContent());
492 $this->assertSame('http://3.3.3.3/cover.jpg', $entry->getPreviewPicture());
493 $this->assertSame('text/html', $entry->getMimetype());
494 $this->assertSame('fr', $entry->getLanguage());
495 $this->assertSame('200', $entry->getHttpStatus());
496 $this->assertSame('1.1.1.1', $entry->getDomainName());
499 public function testWithImageAsContent()
501 $tagger = $this->getTaggerMock();
502 $tagger->expects($this->once())
505 $graby = $this->getMockBuilder('Graby\Graby')
506 ->setMethods(['fetchContent'])
507 ->disableOriginalConstructor()
510 $graby->expects($this->any())
511 ->method('fetchContent')
513 'html' => '<p><img src="http://1.1.1.1/image.jpg" /></p>',
514 'title' => 'this is my title',
515 'url' => 'http://1.1.1.1/image.jpg',
516 'content_type' => 'image/jpeg',
521 $proxy = new ContentProxy($graby, $tagger, $this->getValidator(), $this->getLogger(), $this->fetchingErrorMessage
);
522 $entry = new Entry(new User());
523 $proxy->updateEntry($entry, 'http://0.0.0.0');
525 $this->assertSame('http://1.1.1.1/image.jpg', $entry->getUrl());
526 $this->assertSame('this is my title', $entry->getTitle());
527 $this->assertContains('http://1.1.1.1/image.jpg', $entry->getContent());
528 $this->assertSame('http://1.1.1.1/image.jpg', $entry->getPreviewPicture());
529 $this->assertSame('image/jpeg', $entry->getMimetype());
530 $this->assertSame('200', $entry->getHttpStatus());
531 $this->assertSame('1.1.1.1', $entry->getDomainName());
534 private function getTaggerMock()
536 return $this->getMockBuilder(RuleBasedTagger
::class)
537 ->setMethods(['tag'])
538 ->disableOriginalConstructor()
542 private function getLogger()
544 return new NullLogger();
547 private function getValidator()
549 return $this->getMockBuilder(RecursiveValidator
::class)
550 ->setMethods(['validate'])
551 ->disableOriginalConstructor()