1. Go to the download page for the algolia/php-dom-parser library and download it, choosing the download type "require".
2. Extract the ZIP file and open index.php.
3. Add the following code to index.php:
<?php
// Load the Composer autoloader relative to this file, so the script works
// regardless of the current working directory.
require_once __DIR__ . '/vendor/autoload.php';

/* Start to develop here. Best regards https://php-download.com/ */

// algolia/php-dom-parser example snippet:
// download a blog article and turn its HTML into Algolia search records.

$articleUrl = 'https://blog.algolia.com/how-we-re-invented-our-office-space-in-paris/';
$article = file_get_contents($articleUrl);

if ($article === false) {
    // file_get_contents() returns false on failure; stop here rather than
    // handing a boolean to the parser.
    throw new \RuntimeException('Unable to download the article from ' . $articleUrl);
}

$parser = new \Algolia\DOMParser();

// Exclude content by CSS selectors.
$parser->setExcludeSelectors(array(
    'pre',
    '.entry-meta',
    'div.rp4wp-related-posts',
));

// Only parse what is inside the given CSS selector.
// If there are multiple nodes matching, they will all be parsed.
$parser->setRootSelector('article.post');

// Map each record attribute name (array key) to the CSS selector(s) whose
// content should populate it (array value).
$parser->setAttributeSelectors(array(
    'title1'  => 'h1',
    'title2'  => 'h2',
    'title3'  => 'h3',
    'title4'  => 'h4',
    'title5'  => 'h5',
    'title6'  => 'h6',
    'content' => 'p, ul, ol, dl, table',
));

// Add some attributes that will be part of every record.
$parser->setSharedAttributes(array(
    'url'    => 'http://www.example.com',
    'visits' => 1933,
));

// Turn the DOM into Algolia search friendly records.
$records = $parser->parse($article);

// Dump the resulting records for inspection.
var_dump($records);