2015-09-10 21:57:25 +02:00
< ? php
2016-12-03 15:44:34 +01:00
namespace Tests\Wallabag\CoreBundle\Helper ;
2015-09-10 21:57:25 +02:00
2015-10-31 16:38:49 +01:00
use Psr\Log\NullLogger ;
2015-09-10 21:57:25 +02:00
use Wallabag\CoreBundle\Helper\ContentProxy ;
2016-02-19 14:22:20 +01:00
use Wallabag\CoreBundle\Entity\Entry ;
use Wallabag\CoreBundle\Entity\Tag ;
2015-12-22 10:16:34 +01:00
use Wallabag\UserBundle\Entity\User ;
2017-05-27 22:08:14 +02:00
use Wallabag\CoreBundle\Helper\RuleBasedTagger ;
2017-05-12 07:53:21 +02:00
use Graby\Graby ;
2015-09-10 21:57:25 +02:00
2016-12-03 15:44:34 +01:00
class ContentProxyTest extends \PHPUnit_Framework_TestCase
2015-09-10 21:57:25 +02:00
{
2017-05-24 12:57:46 +02:00
private $fetchingErrorMessage = 'wallabag can\'t retrieve contents for this article. Please <a href="http://doc.wallabag.org/en/user/errors_during_fetching.html#how-can-i-help-to-fix-that">troubleshoot this issue</a>.' ;
2016-12-03 15:44:34 +01:00
2016-03-27 20:35:56 +02:00
public function testWithBadUrl ()
{
$tagger = $this -> getTaggerMock ();
$tagger -> expects ( $this -> once ())
-> method ( 'tag' );
$graby = $this -> getMockBuilder ( 'Graby\Graby' )
2016-04-12 11:36:01 +02:00
-> setMethods ([ 'fetchContent' ])
2016-03-27 20:35:56 +02:00
-> disableOriginalConstructor ()
-> getMock ();
$graby -> expects ( $this -> any ())
-> method ( 'fetchContent' )
2016-04-12 11:36:01 +02:00
-> willReturn ([
2016-03-27 20:35:56 +02:00
'html' => false ,
'title' => '' ,
'url' => '' ,
'content_type' => '' ,
'language' => '' ,
2016-04-12 11:36:01 +02:00
]);
2016-03-27 20:35:56 +02:00
2017-05-27 22:08:14 +02:00
$proxy = new ContentProxy ( $graby , $tagger , $this -> getLogger (), $this -> fetchingErrorMessage );
2016-03-27 20:35:56 +02:00
$entry = $proxy -> updateEntry ( new Entry ( new User ()), 'http://user@:80' );
$this -> assertEquals ( 'http://user@:80' , $entry -> getUrl ());
$this -> assertEmpty ( $entry -> getTitle ());
2016-12-03 05:59:18 +01:00
$this -> assertEquals ( $this -> fetchingErrorMessage , $entry -> getContent ());
2016-03-27 20:35:56 +02:00
$this -> assertEmpty ( $entry -> getPreviewPicture ());
$this -> assertEmpty ( $entry -> getMimetype ());
$this -> assertEmpty ( $entry -> getLanguage ());
$this -> assertEquals ( 0.0 , $entry -> getReadingTime ());
$this -> assertEquals ( false , $entry -> getDomainName ());
}
2015-09-10 21:57:25 +02:00
public function testWithEmptyContent ()
{
2015-10-11 22:27:47 +02:00
$tagger = $this -> getTaggerMock ();
$tagger -> expects ( $this -> once ())
-> method ( 'tag' );
2015-09-10 21:57:25 +02:00
$graby = $this -> getMockBuilder ( 'Graby\Graby' )
2016-04-12 11:36:01 +02:00
-> setMethods ([ 'fetchContent' ])
2015-09-10 21:57:25 +02:00
-> disableOriginalConstructor ()
-> getMock ();
$graby -> expects ( $this -> any ())
-> method ( 'fetchContent' )
2016-04-12 11:36:01 +02:00
-> willReturn ([
2015-09-20 22:37:27 +02:00
'html' => false ,
'title' => '' ,
'url' => '' ,
'content_type' => '' ,
'language' => '' ,
2016-04-12 11:36:01 +02:00
]);
2015-09-10 21:57:25 +02:00
2017-05-27 22:08:14 +02:00
$proxy = new ContentProxy ( $graby , $tagger , $this -> getLogger (), $this -> fetchingErrorMessage );
2015-09-10 21:57:25 +02:00
$entry = $proxy -> updateEntry ( new Entry ( new User ()), 'http://0.0.0.0' );
$this -> assertEquals ( 'http://0.0.0.0' , $entry -> getUrl ());
$this -> assertEmpty ( $entry -> getTitle ());
2016-12-03 05:59:18 +01:00
$this -> assertEquals ( $this -> fetchingErrorMessage , $entry -> getContent ());
2015-09-10 21:57:25 +02:00
$this -> assertEmpty ( $entry -> getPreviewPicture ());
$this -> assertEmpty ( $entry -> getMimetype ());
2015-09-20 22:37:27 +02:00
$this -> assertEmpty ( $entry -> getLanguage ());
2015-09-28 19:35:33 +02:00
$this -> assertEquals ( 0.0 , $entry -> getReadingTime ());
$this -> assertEquals ( '0.0.0.0' , $entry -> getDomainName ());
2015-09-10 21:57:25 +02:00
}
public function testWithEmptyContentButOG ()
{
2015-10-11 22:27:47 +02:00
$tagger = $this -> getTaggerMock ();
$tagger -> expects ( $this -> once ())
-> method ( 'tag' );
2015-09-10 21:57:25 +02:00
$graby = $this -> getMockBuilder ( 'Graby\Graby' )
2016-04-12 11:36:01 +02:00
-> setMethods ([ 'fetchContent' ])
2015-09-10 21:57:25 +02:00
-> disableOriginalConstructor ()
-> getMock ();
$graby -> expects ( $this -> any ())
-> method ( 'fetchContent' )
2016-04-12 11:36:01 +02:00
-> willReturn ([
2015-09-20 22:37:27 +02:00
'html' => false ,
'title' => '' ,
'url' => '' ,
'content_type' => '' ,
'language' => '' ,
2016-11-18 15:09:21 +01:00
'status' => '' ,
2016-04-12 11:36:01 +02:00
'open_graph' => [
2015-09-20 22:37:27 +02:00
'og_title' => 'my title' ,
'og_description' => 'desc' ,
2016-04-12 11:36:01 +02:00
],
]);
2015-09-10 21:57:25 +02:00
2017-05-27 22:08:14 +02:00
$proxy = new ContentProxy ( $graby , $tagger , $this -> getLogger (), $this -> fetchingErrorMessage );
2015-09-28 19:35:33 +02:00
$entry = $proxy -> updateEntry ( new Entry ( new User ()), 'http://domain.io' );
2015-09-10 21:57:25 +02:00
2015-09-28 19:35:33 +02:00
$this -> assertEquals ( 'http://domain.io' , $entry -> getUrl ());
2015-09-10 21:57:25 +02:00
$this -> assertEquals ( 'my title' , $entry -> getTitle ());
2017-05-05 14:33:36 +02:00
$this -> assertEquals ( $this -> fetchingErrorMessage . '<p><i>But we found a short description: </i></p>desc' , $entry -> getContent ());
2015-09-10 21:57:25 +02:00
$this -> assertEmpty ( $entry -> getPreviewPicture ());
2015-09-20 22:37:27 +02:00
$this -> assertEmpty ( $entry -> getLanguage ());
2016-11-18 15:09:21 +01:00
$this -> assertEmpty ( $entry -> getHttpStatus ());
2015-09-10 21:57:25 +02:00
$this -> assertEmpty ( $entry -> getMimetype ());
2015-09-28 19:35:33 +02:00
$this -> assertEquals ( 0.0 , $entry -> getReadingTime ());
$this -> assertEquals ( 'domain.io' , $entry -> getDomainName ());
2015-09-10 21:57:25 +02:00
}
public function testWithContent ()
{
2015-10-11 22:27:47 +02:00
$tagger = $this -> getTaggerMock ();
$tagger -> expects ( $this -> once ())
-> method ( 'tag' );
2015-09-10 21:57:25 +02:00
$graby = $this -> getMockBuilder ( 'Graby\Graby' )
2016-04-12 11:36:01 +02:00
-> setMethods ([ 'fetchContent' ])
2015-09-10 21:57:25 +02:00
-> disableOriginalConstructor ()
-> getMock ();
$graby -> expects ( $this -> any ())
-> method ( 'fetchContent' )
2016-04-12 11:36:01 +02:00
-> willReturn ([
2015-09-28 19:35:33 +02:00
'html' => str_repeat ( 'this is my content' , 325 ),
2015-09-10 21:57:25 +02:00
'title' => 'this is my title' ,
'url' => 'http://1.1.1.1' ,
'content_type' => 'text/html' ,
2015-09-20 22:37:27 +02:00
'language' => 'fr' ,
2016-11-18 15:09:21 +01:00
'status' => '200' ,
2016-04-12 11:36:01 +02:00
'open_graph' => [
2015-09-10 21:57:25 +02:00
'og_title' => 'my OG title' ,
'og_description' => 'OG desc' ,
2015-09-10 22:00:53 +02:00
'og_image' => 'http://3.3.3.3/cover.jpg' ,
2016-04-12 11:36:01 +02:00
],
]);
2015-09-10 21:57:25 +02:00
2017-05-27 22:08:14 +02:00
$proxy = new ContentProxy ( $graby , $tagger , $this -> getLogger (), $this -> fetchingErrorMessage );
2015-09-10 21:57:25 +02:00
$entry = $proxy -> updateEntry ( new Entry ( new User ()), 'http://0.0.0.0' );
$this -> assertEquals ( 'http://1.1.1.1' , $entry -> getUrl ());
$this -> assertEquals ( 'this is my title' , $entry -> getTitle ());
2015-09-28 19:35:33 +02:00
$this -> assertContains ( 'this is my content' , $entry -> getContent ());
2015-09-10 21:57:25 +02:00
$this -> assertEquals ( 'http://3.3.3.3/cover.jpg' , $entry -> getPreviewPicture ());
$this -> assertEquals ( 'text/html' , $entry -> getMimetype ());
2015-09-20 22:37:27 +02:00
$this -> assertEquals ( 'fr' , $entry -> getLanguage ());
2016-11-18 15:09:21 +01:00
$this -> assertEquals ( '200' , $entry -> getHttpStatus ());
2015-09-28 19:35:33 +02:00
$this -> assertEquals ( 4.0 , $entry -> getReadingTime ());
$this -> assertEquals ( '1.1.1.1' , $entry -> getDomainName ());
2015-09-10 21:57:25 +02:00
}
2015-10-11 22:27:47 +02:00
2017-01-10 17:42:34 +01:00
public function testWithContentAndNoOgImage ()
{
$tagger = $this -> getTaggerMock ();
$tagger -> expects ( $this -> once ())
-> method ( 'tag' );
$graby = $this -> getMockBuilder ( 'Graby\Graby' )
-> setMethods ([ 'fetchContent' ])
-> disableOriginalConstructor ()
-> getMock ();
$graby -> expects ( $this -> any ())
-> method ( 'fetchContent' )
-> willReturn ([
'html' => str_repeat ( 'this is my content' , 325 ),
'title' => 'this is my title' ,
'url' => 'http://1.1.1.1' ,
'content_type' => 'text/html' ,
'language' => 'fr' ,
'status' => '200' ,
'open_graph' => [
'og_title' => 'my OG title' ,
'og_description' => 'OG desc' ,
'og_image' => false ,
],
]);
2017-05-27 22:08:14 +02:00
$proxy = new ContentProxy ( $graby , $tagger , $this -> getLogger (), $this -> fetchingErrorMessage );
2017-01-10 17:42:34 +01:00
$entry = $proxy -> updateEntry ( new Entry ( new User ()), 'http://0.0.0.0' );
$this -> assertEquals ( 'http://1.1.1.1' , $entry -> getUrl ());
$this -> assertEquals ( 'this is my title' , $entry -> getTitle ());
$this -> assertContains ( 'this is my content' , $entry -> getContent ());
$this -> assertNull ( $entry -> getPreviewPicture ());
$this -> assertEquals ( 'text/html' , $entry -> getMimetype ());
$this -> assertEquals ( 'fr' , $entry -> getLanguage ());
$this -> assertEquals ( '200' , $entry -> getHttpStatus ());
$this -> assertEquals ( 4.0 , $entry -> getReadingTime ());
$this -> assertEquals ( '1.1.1.1' , $entry -> getDomainName ());
}
2016-03-27 20:35:56 +02:00
public function testWithForcedContent ()
{
$tagger = $this -> getTaggerMock ();
$tagger -> expects ( $this -> once ())
-> method ( 'tag' );
$graby = $this -> getMockBuilder ( 'Graby\Graby' ) -> getMock ();
2017-05-27 22:08:14 +02:00
$proxy = new ContentProxy ( $graby , $tagger , $this -> getLogger (), $this -> fetchingErrorMessage );
2016-03-27 20:35:56 +02:00
$entry = $proxy -> updateEntry ( new Entry ( new User ()), 'http://0.0.0.0' , [
'html' => str_repeat ( 'this is my content' , 325 ),
'title' => 'this is my title' ,
'url' => 'http://1.1.1.1' ,
'content_type' => 'text/html' ,
'language' => 'fr' ,
]);
$this -> assertEquals ( 'http://1.1.1.1' , $entry -> getUrl ());
$this -> assertEquals ( 'this is my title' , $entry -> getTitle ());
$this -> assertContains ( 'this is my content' , $entry -> getContent ());
$this -> assertEquals ( 'text/html' , $entry -> getMimetype ());
$this -> assertEquals ( 'fr' , $entry -> getLanguage ());
$this -> assertEquals ( 4.0 , $entry -> getReadingTime ());
$this -> assertEquals ( '1.1.1.1' , $entry -> getDomainName ());
}
public function testTaggerThrowException ()
{
$graby = $this -> getMockBuilder ( 'Graby\Graby' )
-> disableOriginalConstructor ()
-> getMock ();
$tagger = $this -> getTaggerMock ();
$tagger -> expects ( $this -> once ())
-> method ( 'tag' )
-> will ( $this -> throwException ( new \Exception ()));
2017-05-27 22:08:14 +02:00
$proxy = new ContentProxy ( $graby , $tagger , $this -> getLogger (), $this -> fetchingErrorMessage );
2016-03-27 20:35:56 +02:00
$entry = $proxy -> updateEntry ( new Entry ( new User ()), 'http://0.0.0.0' , [
'html' => str_repeat ( 'this is my content' , 325 ),
'title' => 'this is my title' ,
'url' => 'http://1.1.1.1' ,
'content_type' => 'text/html' ,
'language' => 'fr' ,
]);
$this -> assertCount ( 0 , $entry -> getTags ());
}
2017-05-12 07:53:21 +02:00
public function dataForCrazyHtml ()
{
return [
'script and comment' => [
'<strong>Script inside:</strong> <!--[if gte IE 4]><script>alert(\'lol\');</script><![endif]--><br />' ,
'lol'
],
'script' => [
'<strong>Script inside:</strong><script>alert(\'lol\');</script>' ,
'script'
],
];
}
/**
* @ dataProvider dataForCrazyHtml
*/
public function testWithCrazyHtmlContent ( $html , $escapedString )
{
$tagger = $this -> getTaggerMock ();
$tagger -> expects ( $this -> once ())
-> method ( 'tag' );
$graby = new Graby ();
$proxy = new ContentProxy ( $graby , $tagger , $this -> getTagRepositoryMock (), $this -> getLogger (), $this -> fetchingErrorMessage );
$entry = $proxy -> updateEntry (
new Entry ( new User ()),
'http://1.1.1.1' ,
[
'html' => $html ,
'title' => 'this is my title' ,
'url' => 'http://1.1.1.1' ,
'content_type' => 'text/html' ,
'language' => 'fr' ,
'status' => '200' ,
'open_graph' => [
'og_title' => 'my OG title' ,
'og_description' => 'OG desc' ,
'og_image' => 'http://3.3.3.3/cover.jpg' ,
],
]
);
$this -> assertEquals ( 'http://1.1.1.1' , $entry -> getUrl ());
$this -> assertEquals ( 'this is my title' , $entry -> getTitle ());
$this -> assertNotContains ( $escapedString , $entry -> getContent ());
$this -> assertEquals ( 'http://3.3.3.3/cover.jpg' , $entry -> getPreviewPicture ());
$this -> assertEquals ( 'text/html' , $entry -> getMimetype ());
$this -> assertEquals ( 'fr' , $entry -> getLanguage ());
$this -> assertEquals ( '200' , $entry -> getHttpStatus ());
$this -> assertEquals ( '1.1.1.1' , $entry -> getDomainName ());
}
2015-10-11 22:27:47 +02:00
private function getTaggerMock ()
{
2017-05-27 22:08:14 +02:00
return $this -> getMockBuilder ( RuleBasedTagger :: class )
2016-04-12 11:36:01 +02:00
-> setMethods ([ 'tag' ])
2015-10-11 22:27:47 +02:00
-> disableOriginalConstructor ()
-> getMock ();
}
2015-10-17 17:45:51 +02:00
2015-10-31 16:38:49 +01:00
private function getLogger ()
2015-10-17 17:45:51 +02:00
{
2015-10-31 16:38:49 +01:00
return new NullLogger ();
2015-10-17 17:45:51 +02:00
}
2015-09-10 21:57:25 +02:00
}