Method | Description | |
---|---|---|
disableCandidateParser ( ) : | Disable candidates parsing. | |
download ( ) : boolean | Download the HTML content. | |
execute ( $pageContent = '', $recursionDepth ) | Execute the scraper. | |
getEncoding ( ) : string | Get encoding. | |
getFilteredContent ( ) : string | Get filtered relevant content. | |
getParser ( ) : PicoFeed\Scraper\ParserInterface | Get the parser. | |
getRawContent ( ) : string | Get raw content (unfiltered). | |
getRelevantContent ( ) : string | Get relevant content. | |
getUrl ( ) : string | Get URL to download. | |
hasRelevantContent ( ) : boolean | Return true if the scraper found relevant content. | |
prepareHtml ( ) | Normalize encoding and strip head tag. | |
setEncoding ( string $encoding ) : | Set encoding. | |
setRawContent ( string $html ) : | Set raw content (unfiltered). | |
setUrl ( string $url ) : | Set URL to download. | |
public disableCandidateParser ( ) : | ||
return |
public getFilteredContent ( ) : string | ||
return | string |
public getParser ( ) : PicoFeed\Scraper\ParserInterface | ||
return | PicoFeed\Scraper\ParserInterface |
public getRawContent ( ) : string | ||
return | string |
public getRelevantContent ( ) : string | ||
return | string |
public hasRelevantContent ( ) : boolean | ||
return | boolean |
public setEncoding ( string $encoding ) : | ||
$encoding | string | |
return |
public setRawContent ( string $html ) : | ||
$html | string | |
return |