stuff' . $title . ''; $this->assertEquals($title, html_extract_title($html)); $html = '' . $title . 'blablaanother'; $this->assertEquals($title, html_extract_title($html)); } /** * Test html_extract_title() when the title is not found. */ public function testHtmlExtractNonExistentTitle() { $html = 'stuff'; $this->assertFalse(html_extract_title($html)); } /** * Test headers_extract_charset() when the charset is found. */ public function testHeadersExtractExistentCharset() { $charset = 'x-MacCroatian'; $headers = 'text/html; charset=' . $charset; $this->assertEquals(strtolower($charset), header_extract_charset($headers)); } /** * Test headers_extract_charset() when the charset is found with odd quotes. */ public function testHeadersExtractExistentCharsetWithQuotes() { $charset = 'x-MacCroatian'; $headers = 'text/html; charset="' . $charset . '"otherstuff="test"'; $this->assertEquals(strtolower($charset), header_extract_charset($headers)); $headers = 'text/html; charset=\'' . $charset . '\'otherstuff="test"'; $this->assertEquals(strtolower($charset), header_extract_charset($headers)); } /** * Test headers_extract_charset() when the charset is not found. */ public function testHeadersExtractNonExistentCharset() { $headers = ''; $this->assertFalse(header_extract_charset($headers)); $headers = 'text/html'; $this->assertFalse(header_extract_charset($headers)); } /** * Test html_extract_charset() when the charset is found. */ public function testHtmlExtractExistentCharset() { $charset = 'x-MacCroatian'; $html = 'stuff2'; $this->assertEquals(strtolower($charset), html_extract_charset($html)); } /** * Test html_extract_charset() when the charset is not found. */ public function testHtmlExtractNonExistentCharset() { $html = 'stuff'; $this->assertFalse(html_extract_charset($html)); $html = 'stuff'; $this->assertFalse(html_extract_charset($html)); } /** * Test html_extract_tag() when the tag '; $this->assertEquals($description, html_extract_tag('description', $html)); // Simple OpenGraph $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // Simple reversed OpenGraph $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // ItemProp OpenGraph $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // OpenGraph without quotes $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // OpenGraph reversed without quotes $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // OpenGraph with noise $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // OpenGraph reversed with noise $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // OpenGraph multiple properties start $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // OpenGraph multiple properties end $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // OpenGraph multiple properties both end $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // OpenGraph multiple properties both end with noise $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // OpenGraph reversed multiple properties start $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // OpenGraph reversed multiple properties end $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // OpenGraph reversed multiple properties both end $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // OpenGraph reversed multiple properties both end with noise $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); // Suggestion from #1375 $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); } /** * Test html_extract_tag() with double quoted content containing single quote, and the opposite. */ public function testHtmlExtractExistentNameTagWithMixedQuotes(): void { $description = 'Bob and Alice share M&M\'s.'; $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); $description = 'Bob and Alice share "cookies".'; $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); $html = ''; $this->assertEquals($description, html_extract_tag('description', $html)); } /** * Test html_extract_tag() when the tag assertFalse(html_extract_tag('description', $html)); // Partial meta tag $html = ''; $this->assertFalse(html_extract_tag('description', $html)); $html = ''; $this->assertFalse(html_extract_tag('description', $html)); $html = ''; $this->assertFalse(html_extract_tag('description', $html)); $html = ''; $this->assertFalse(html_extract_tag('description', $html)); $html = ''; $this->assertFalse(html_extract_tag('description', $html)); $html = ''; $this->assertFalse(html_extract_tag('description', $html)); } /** * Test html_extract_tag() when the tag '; $this->assertEquals($description, html_extract_tag('description', $html)); } /** * Test html_extract_tag() when the tag '; $this->assertFalse(html_extract_tag('description', $html)); } public function testHtmlExtractDescriptionFromGoogleRealCase(): void { $html = 'id="gsr">'. ''. 'assertSame('Bonnes fêtes de fin d\'année ! #GoogleDoodle', html_extract_tag('description', $html)); } /** * Test the header callback with valid value */ public function testCurlHeaderCallbackOk(): void { $callback = get_curl_header_callback($charset, 'ut_curl_getinfo_ok'); $data = [ 'HTTP/1.1 200 OK', 'Server: GitHub.com', 'Date: Sat, 28 Oct 2017 12:01:33 GMT', 'Content-Type: text/html; charset=utf-8', 'Status: 200 OK', ]; foreach ($data as $chunk) { static::assertIsInt($callback(null, $chunk)); } static::assertSame('utf-8', $charset); } /** * Test the download callback with valid value */ public function testCurlDownloadCallbackOk(): void { $charset = 'utf-8'; $callback = get_curl_download_callback( $charset, $title, $desc, $keywords, false, ' ' ); $data = [ 'th=device-width">' . 'Refactoring · GitHub' . '' . '', ]; foreach ($data as $chunk) { static::assertSame(strlen($chunk), $callback(null, $chunk)); } static::assertSame('utf-8', $charset); static::assertSame('Refactoring · GitHub', $title); static::assertEmpty($desc); static::assertEmpty($keywords); } /** * Test the header callback with valid value */ public function testCurlHeaderCallbackNoCharset(): void { $callback = get_curl_header_callback($charset, 'ut_curl_getinfo_no_charset'); $data = [ 'HTTP/1.1 200 OK', ]; foreach ($data as $chunk) { static::assertSame(strlen($chunk), $callback(null, $chunk)); } static::assertFalse($charset); } /** * Test the download callback with valid values and no charset */ public function testCurlDownloadCallbackOkNoCharset(): void { $charset = null; $callback = get_curl_download_callback( $charset, $title, $desc, $keywords, false, ' ' ); $data = [ 'end' => 'th=device-width">' . 'Refactoring · GitHub' . '' . '', ]; foreach ($data as $chunk) { static::assertSame(strlen($chunk), $callback(null, $chunk)); } $this->assertEmpty($charset); $this->assertEquals('Refactoring · GitHub', $title); $this->assertEmpty($desc); $this->assertEmpty($keywords); } /** * Test the download callback with valid values and no charset */ public function testCurlDownloadCallbackOkHtmlCharset(): void { $charset = null; $callback = get_curl_download_callback( $charset, $title, $desc, $keywords, false, ' ' ); $data = [ '', 'end' => 'th=device-width">' . 'Refactoring · GitHub' . '' . '', ]; foreach ($data as $chunk) { static::assertSame(strlen($chunk), $callback(null, $chunk)); } $this->assertEquals('utf-8', $charset); $this->assertEquals('Refactoring · GitHub', $title); $this->assertEmpty($desc); $this->assertEmpty($keywords); } /** * Test the download callback with valid values and no title */ public function testCurlDownloadCallbackOkNoTitle(): void { $charset = 'utf-8'; $callback = get_curl_download_callback( $charset, $title, $desc, $keywords, false, ' ' ); $data = [ 'end' => 'th=device-width">Refactoring · GitHub' . 'Refactoring · GitHub' . '' . '', ]; foreach ($data as $chunk) { static::assertSame(strlen($chunk), $callback(null, $chunk)); } $this->assertEquals('utf-8', $charset); $this->assertEquals('Refactoring · GitHub', $title); $this->assertEquals('link desc', $desc); $this->assertEquals('key1 key2', $keywords); } /** * Test the download callback with valid value, and retrieve_description option enabled, * but no desc or keyword defined in the page. */ public function testCurlDownloadCallbackOkWithDescNotFound(): void { $charset = 'utf-8'; $callback = get_curl_download_callback( $charset, $title, $desc, $keywords, true, 'ut_curl_getinfo_ok' ); $data = [ 'th=device-width">' . 'Refactoring · GitHub' . '' . 'http://hello.there/is=someone#here otherstuff'; $processedText = text2clickable($text); $this->assertEquals($expectedText, $processedText); $text = 'stuff http://hello.there/is=someone#here(please) otherstuff'; $expectedText = 'stuff ' . 'http://hello.there/is=someone#here(please) otherstuff'; $processedText = text2clickable($text); $this->assertEquals($expectedText, $processedText); $text = 'stuff http://hello.there/is=someone#here(please)&no otherstuff'; $text = 'stuff http://hello.there/is=someone#here(please)&no otherstuff'; $expectedText = 'stuff ' . 'http://hello.there/is=someone#here(please)&no otherstuff'; $processedText = text2clickable($text); $this->assertEquals($expectedText, $processedText); } /** * Test testSpace2nbsp. */ public function testSpace2nbsp() { $text = ' Are you thrilled by flags ?' . PHP_EOL . ' Really?'; $expectedText = '  Are you   thrilled  by flags   ?' . PHP_EOL . ' Really?'; $processedText = space2nbsp($text); $this->assertEquals($expectedText, $processedText); } /** * Test hashtags auto-link. */ public function testHashtagAutolink() { $index = 'http://domain.tld/'; $rawDescription = '#hashtag\n # nothashtag\n test#nothashtag #hashtag \#nothashtag\n test #hashtag #hashtag test #hashtag.test\n #hashtag #hashtag-nothashtag #hashtag_hashtag\n What is #ашок anyway?\n カタカナ #カタカナ」カタカナ\n'; $autolinkedDescription = hashtag_autolink($rawDescription, $index); $this->assertContainsPolyfill($this->getHashtagLink('hashtag', $index), $autolinkedDescription); $this->assertNotContainsPolyfill(' #hashtag', $autolinkedDescription); $this->assertNotContainsPolyfill('>#nothashtag', $autolinkedDescription); $this->assertContainsPolyfill($this->getHashtagLink('ашок', $index), $autolinkedDescription); $this->assertContainsPolyfill($this->getHashtagLink('カタカナ', $index), $autolinkedDescription); $this->assertContainsPolyfill($this->getHashtagLink('hashtag_hashtag', $index), $autolinkedDescription); $this->assertNotContainsPolyfill($this->getHashtagLink('hashtag-nothashtag', $index), $autolinkedDescription); } /** * Test hashtags auto-link without index URL. */ public function testHashtagAutolinkNoIndex() { $rawDescription = 'blabla #hashtag x#nothashtag'; $autolinkedDescription = hashtag_autolink($rawDescription); $this->assertContainsPolyfill($this->getHashtagLink('hashtag'), $autolinkedDescription); $this->assertNotContainsPolyfill(' #hashtag', $autolinkedDescription); $this->assertNotContainsPolyfill('>#nothashtag', $autolinkedDescription); } /** * Test is_note with note URLs. */ public function testIsNote() { $this->assertTrue(is_note('?')); $this->assertTrue(is_note('?abcDEf')); $this->assertTrue(is_note('?_abcDEf#123')); } /** * Test is_note with non note URLs. */ public function testIsNotNote() { $this->assertFalse(is_note('')); $this->assertFalse(is_note('nope')); $this->assertFalse(is_note('https://github.com/shaarli/Shaarli/?hi')); } /** * Test tags_str2array with whitespace separator. */ public function testTagsStr2ArrayWithSpaceSeparator(): void { $separator = ' '; static::assertSame(['tag1', 'tag2', 'tag3'], tags_str2array('tag1 tag2 tag3', $separator)); static::assertSame(['tag1', 'tag2', 'tag3'], tags_str2array('tag1 tag2 tag3', $separator)); static::assertSame(['tag1', 'tag2', 'tag3'], tags_str2array(' tag1 tag2 tag3 ', $separator)); static::assertSame(['tag1@', 'tag2,', '.tag3'], tags_str2array(' tag1@ tag2, .tag3 ', $separator)); static::assertSame([], tags_str2array('', $separator)); static::assertSame([], tags_str2array(' ', $separator)); static::assertSame([], tags_str2array(null, $separator)); } /** * Test tags_str2array with @ separator. */ public function testTagsStr2ArrayWithCharSeparator(): void { $separator = '@'; static::assertSame(['tag1', 'tag2', 'tag3'], tags_str2array('tag1@tag2@tag3', $separator)); static::assertSame(['tag1', 'tag2', 'tag3'], tags_str2array('tag1@@@@tag2@@@@tag3', $separator)); static::assertSame(['tag1', 'tag2', 'tag3'], tags_str2array('@@@tag1@@@tag2@@@@tag3@@', $separator)); static::assertSame( ['tag1#', 'tag2, and other', '.tag3'], tags_str2array('@@@ tag1# @@@ tag2, and other @@@@.tag3@@', $separator) ); static::assertSame([], tags_str2array('', $separator)); static::assertSame([], tags_str2array(' ', $separator)); static::assertSame([], tags_str2array(null, $separator)); } /** * Test tags_array2str with ' ' separator. */ public function testTagsArray2StrWithSpaceSeparator(): void { $separator = ' '; static::assertSame('tag1 tag2 tag3', tags_array2str(['tag1', 'tag2', 'tag3'], $separator)); static::assertSame('tag1, tag2@ tag3', tags_array2str(['tag1,', 'tag2@', 'tag3'], $separator)); static::assertSame('tag1 tag2 tag3', tags_array2str([' tag1 ', 'tag2', 'tag3 '], $separator)); static::assertSame('tag1 tag2 tag3', tags_array2str([' tag1 ', ' ', 'tag2', ' ', 'tag3 '], $separator)); static::assertSame('tag1', tags_array2str([' tag1 '], $separator)); static::assertSame('', tags_array2str([' '], $separator)); static::assertSame('', tags_array2str([], $separator)); static::assertSame('', tags_array2str(null, $separator)); } /** * Test tags_array2str with @ separator. */ public function testTagsArray2StrWithCharSeparator(): void { $separator = '@'; static::assertSame('tag1@tag2@tag3', tags_array2str(['tag1', 'tag2', 'tag3'], $separator)); static::assertSame('tag1,@tag2@tag3', tags_array2str(['tag1,', 'tag2@', 'tag3'], $separator)); static::assertSame( 'tag1@tag2, and other@tag3', tags_array2str(['@@@@ tag1@@@', ' @tag2, and other @', 'tag3@@@@'], $separator) ); static::assertSame('tag1@tag2@tag3', tags_array2str(['@@@tag1@@@', '@', 'tag2', '@@@', 'tag3@@@'], $separator)); static::assertSame('tag1', tags_array2str(['@@@@tag1@@@@'], $separator)); static::assertSame('', tags_array2str(['@@@'], $separator)); static::assertSame('', tags_array2str([], $separator)); static::assertSame('', tags_array2str(null, $separator)); } /** * Test tags_array2str with @ separator. */ public function testTagsFilterWithSpaceSeparator(): void { $separator = ' '; static::assertSame(['tag1', 'tag2', 'tag3'], tags_filter(['tag1', 'tag2', 'tag3'], $separator)); static::assertSame(['tag1,', 'tag2@', 'tag3'], tags_filter(['tag1,', 'tag2@', 'tag3'], $separator)); static::assertSame(['tag1', 'tag2', 'tag3'], tags_filter([' tag1 ', 'tag2', 'tag3 '], $separator)); static::assertSame(['tag1', 'tag2', 'tag3'], tags_filter([' tag1 ', ' ', 'tag2', ' ', 'tag3 '], $separator)); static::assertSame(['tag1'], tags_filter([' tag1 '], $separator)); static::assertSame([], tags_filter([' '], $separator)); static::assertSame([], tags_filter([], $separator)); static::assertSame([], tags_filter(null, $separator)); } /** * Test tags_array2str with @ separator. */ public function testTagsArrayFilterWithSpaceSeparator(): void { $separator = '@'; static::assertSame(['tag1', 'tag2', 'tag3'], tags_filter(['tag1', 'tag2', 'tag3'], $separator)); static::assertSame(['tag1,', 'tag2#', 'tag3'], tags_filter(['tag1,', 'tag2#', 'tag3'], $separator)); static::assertSame( ['tag1', 'tag2, and other', 'tag3'], tags_filter(['@@@@ tag1@@@', ' @tag2, and other @', 'tag3@@@@'], $separator) ); static::assertSame(['tag1', 'tag2', 'tag3'], tags_filter(['@@@tag1@@@', '@', 'tag2', '@@@', 'tag3@@@'], $separator)); static::assertSame(['tag1'], tags_filter(['@@@@tag1@@@@'], $separator)); static::assertSame([], tags_filter(['@@@'], $separator)); static::assertSame([], tags_filter([], $separator)); static::assertSame([], tags_filter(null, $separator)); } /** * Util function to build an hashtag link. * * @param string $hashtag Hashtag name. * @param string $index Index URL. * * @return string HTML hashtag link. */ private function getHashtagLink($hashtag, $index = '') { $hashtagLink = '#$1'; return str_replace('$1', $hashtag, $hashtagLink); } }