1naveengiri · November 15, 2018 14:46
diff --git a/xpath.php b/xpath.php
 <?php 
 /**
  * Extract the HTML of every node matched by an XPath expression.
  *
  * The markup is parsed with DOMDocument, the expression is evaluated with
  * DOMXPath, and each matched node is deep-copied into a fresh document that
  * is then serialized.
  *
  * @param string $html       HTML markup to search.
  * @param string $expression XPath expression, e.g. //div[@id='breadcrumbs']/span
  * @return string Serialized HTML of the matched nodes, or the 'No match found.'
  *                message (passed through __() with the 'wpscraper' text domain)
  *                when the markup is empty, cannot be parsed, the expression is
  *                malformed, or nothing matches.
  */
 function extract_content_from_html( $html, $expression ){
 	$output  = '';
 	$matched = false;

 	// DOMDocument::loadHTML() rejects an empty string, so only parse real markup.
 	if ( is_string( $html ) && '' !== trim( $html ) ) {
 		$dom = new DOMDocument();

 		// Buffer libxml parse errors instead of emitting them, then put the
 		// caller's setting back so this function has no lasting side effect.
 		$previous = libxml_use_internal_errors( true );
 		$loaded   = $dom->loadHTML( $html );
 		libxml_clear_errors();
 		libxml_use_internal_errors( $previous );

 		if ( $loaded ) {
 			$domXPath    = new DOMXPath( $dom );
 			$domNodeList = $domXPath->query( $expression );

 			// query() yields false for a malformed expression, and an empty
 			// DOMNodeList is still a non-empty object, so test its length.
 			if ( false !== $domNodeList && $domNodeList->length > 0 ) {
 				$domDocument = new DOMDocument();
 				foreach ( $domNodeList as $node ) {
 					$domDocument->appendChild( $domDocument->importNode( $node, true ) );
 				}
 				$output  = $domDocument->saveHTML();
 				$matched = true;
 			}
 		}
 	}

 	if ( ! $matched ) {
 		$output = __( 'No match found.', 'wpscraper' );
 	}

 	return $output;
 }
	<?php
	/**
	 * Extract the HTML of every node matched by an XPath expression.
	 *
	 * The markup is parsed with DOMDocument, the expression is evaluated with
	 * DOMXPath, and each matched node is deep-copied into a fresh document that
	 * is then serialized.
	 *
	 * @param string $html       HTML markup to search.
	 * @param string $expression XPath expression, e.g. //div[@id='breadcrumbs']/span
	 * @return string Serialized HTML of the matched nodes, or the 'No match found.'
	 *                message (passed through __() with the 'wpscraper' text domain)
	 *                when the markup is empty, cannot be parsed, the expression is
	 *                malformed, or nothing matches.
	 */
	function extract_content_from_html( $html, $expression ){
		$output  = '';
		$matched = false;

		// DOMDocument::loadHTML() rejects an empty string, so only parse real markup.
		if ( is_string( $html ) && '' !== trim( $html ) ) {
			$dom = new DOMDocument();

			// Buffer libxml parse errors instead of emitting them, then put the
			// caller's setting back so this function has no lasting side effect.
			$previous = libxml_use_internal_errors( true );
			$loaded   = $dom->loadHTML( $html );
			libxml_clear_errors();
			libxml_use_internal_errors( $previous );

			if ( $loaded ) {
				$domXPath    = new DOMXPath( $dom );
				$domNodeList = $domXPath->query( $expression );

				// query() yields false for a malformed expression, and an empty
				// DOMNodeList is still a non-empty object, so test its length.
				if ( false !== $domNodeList && $domNodeList->length > 0 ) {
					$domDocument = new DOMDocument();
					foreach ( $domNodeList as $node ) {
						$domDocument->appendChild( $domDocument->importNode( $node, true ) );
					}
					$output  = $domDocument->saveHTML();
					$matched = true;
				}
			}
		}

		if ( ! $matched ) {
			$output = __( 'No match found.', 'wpscraper' );
		}

		return $output;
	}
No results found