1. Go to this page and download the library: Download gyaaniguy/pcrawl library. Choose the download type you require.
2. Extract the ZIP file and open the index.php.
3. Add this code to the index.php.
<?php
require_once('vendor/autoload.php');
/* Start to develop here. Best regards https://php-download.com/ */
gyaaniguy / pcrawl example snippets
// Simple clients.
// Plain client with default settings; not referenced again in the visible snippet.
$gu = new GuzzleClient();
// Custom client that does not allow redirects. The later request loop re-enables
// redirects on this same object when a redirect status code is detected.
$uptightNoRedirectClient = new CurlClient();
$uptightNoRedirectClient->setRedirects(0); // disable redirects
// Custom client - thin wrapper around curl
/**
 * CurlClient variant that upgrades plain-HTTP URLs to HTTPS before fetching.
 */
class ConvertToHttpsClient extends CurlClient
{
    /**
     * Fetch $url, rewriting a leading "http://" scheme to "https://".
     *
     * Only the scheme prefix is rewritten; any "http://" that appears later in
     * the URL (for example inside a query-string parameter) is left untouched.
     * The scheme is matched case-insensitively.
     *
     * @param string $url     URL to request.
     * @param array  $options Options forwarded unchanged to the parent client.
     *
     * @return PResponse Response produced by the parent client's get().
     */
    public function get(string $url, array $options = []): PResponse
    {
        $plainScheme = 'http://';
        $schemeLength = strlen($plainScheme);

        // Compare just the prefix so embedded URLs further along are not altered.
        if (strncasecmp($url, $plainScheme, $schemeLength) === 0) {
            $url = 'https://' . substr($url, $schemeLength);
        }

        return parent::get($url, $options);
    }
}
// Detector configured to fail when the response carries one of these redirect status codes.
$redirectDetector = new ResponseDebug();
$redirectDetector->setMustNotExistHttpCodes([301, 302, 303, 307, 308]);

// Detector configured to fail unless the response matches the closing </html> tag pattern.
$fullPageDetector = new ResponseDebug();
$fullPageDetector->setMustExistRegex(['#</html>#']);

$req = new Request();
$url = "http://www.whatsmyua.info";
$req->setClient($uptightNoRedirectClient);

// First attempt runs with redirects disabled. If a redirect status is detected,
// dump the failure detail, re-enable redirects on the client and let the loop
// retry exactly once. The detector is evaluated once per attempt, against the
// response that was just fetched, so the loop condition never sees stale state.
$count = 0;
do {
    $res = $req->get($url);
    $redirectDetector->setResponse($res);
    $redirectDetected = $redirectDetector->isFail();
    if ($redirectDetected) {
        var_dump($redirectDetector->getFailDetail());
        // NOTE(review): presumably allows following a single redirect - confirm against the client API.
        $uptightNoRedirectClient->setRedirects(1);
    }
} while ($redirectDetected && $count++ < 1);

if ($fullPageDetector->setResponse($res)->isFail()) {
    // Report the detector that actually failed (the full-page check, not the redirect check).
    var_dump($fullPageDetector->getFailDetail());
} else {
    // Page looks complete: parse the body and pull out a couple of sample values.
    $parser = new ParserCommon($res->getBody());
    $h1 = $parser->find('h1')->text();
    $htmlClass = $parser->find('html')->attr('class');
}
Loading please wait ...
Before you can download the PHP files, the dependencies must be resolved. This can take a few minutes. Please be patient.