Fetch HTML data from another site's URL using cURL.

Component ID

2336053

Component name

Fetch HTML data from another site's URL using cURL.

Component type

theme

Maintenance status

Development status

Component security advisory coverage

not-covered

Component created

Component changed

Component body

/**
 * Debug helper: print a human-readable dump of a value inside <pre> tags.
 *
 * The dump is produced by print_r() and written straight to the output;
 * nothing is returned.
 *
 * @param mixed $array Value to dump (any type print_r() accepts).
 */
function pr($array)
{
	// Build the dump first, then emit opening tag, dump and closing tag together.
	$dump = print_r($array, true);
	echo "<pre>", $dump, "</pre>";
}


/**
 * Return one capture group from the first match of a pattern in a string.
 *
 * @param string     $text     Subject string to search.
 * @param string     $regex    PCRE pattern, including delimiters and flags.
 * @param int|string $nthValue Index (0 = whole match) or name of the group to return.
 *
 * @return string The captured text, or "" when the pattern does not match
 *                or the requested group is not present in the match.
 */
function regexExtract($text, $regex, $nthValue)
{
	// preg_match() yields 1 on a match, 0 on no match and false on error;
	// only a real match with the requested group present produces a value.
	// The isset() guard avoids an undefined-offset notice (and a null return)
	// when the pattern has fewer groups than $nthValue asks for.
	if (preg_match($regex, $text, $regs) === 1 && isset($regs[$nthValue])) {
		return $regs[$nthValue];
	}

	return "";
}
ini_set('max_execution_time', 3000000);
require_once('simple_html_dom.php');

/**
 * Read the text of the $index-th <td> of a table row.
 *
 * @param object $tr    Row node returned by simple_html_dom's find().
 * @param int    $index Zero-based cell index.
 *
 * @return string The cell's plaintext, or '' when the cell is missing or empty.
 */
function foreclosureCell($tr, $index)
{
	// find() with an index gives back a single node, or nothing when the row
	// has fewer cells (e.g. a header row); guard before reading ->plaintext.
	$cell = $tr->find('td', $index);

	return ($cell && $cell->plaintext != '') ? $cell->plaintext : '';
}

/**
 * Parse an HTML document and turn every row matched by $selector into a record.
 *
 * @param string|false $html     Raw HTML (false/empty when the download failed).
 * @param string       $selector simple_html_dom selector that picks the <tr> nodes.
 *
 * @return array Zero-based list of arrays with the keys
 *               case_number, sales_date, Sheriff, address, jud_amt.
 *               Empty when the HTML is unavailable or cannot be parsed.
 */
function foreclosureRows($html, $selector)
{
	$rows = array();

	if (!is_string($html) || $html === '') {
		return $rows;
	}

	$dom = str_get_html($html);
	if (!$dom) {
		// str_get_html() did not produce a document; report "no rows"
		// instead of calling ->find() on a non-object.
		return $rows;
	}

	foreach ($dom->find($selector) as $tr) {
		$rows[] = array(
			'case_number' => foreclosureCell($tr, 1),
			'sales_date'  => foreclosureCell($tr, 0),
			'Sheriff'     => foreclosureCell($tr, 2),
			'address'     => foreclosureCell($tr, 3),
			'jud_amt'     => foreclosureCell($tr, 4),
		);
	}

	return $rows;
}

/**
 * Download one result page of the grid by replaying its ASP.NET postback.
 *
 * Performs a GET to collect the hidden __VIEWSTATE / __EVENTVALIDATION
 * values, then POSTs them back with the pager event for $page. Both
 * requests go through the same cURL handle so cookies set by the GET are
 * sent with the POST.
 *
 * @param string $url  Address of the listing page.
 * @param int    $page Page number to request.
 *
 * @return string|false HTML of the requested page, or false on any transfer error.
 */
function foreclosureFetchPage($url, $page)
{
	$headers = array(
		'User-Agent: Mozilla/5.0 (Windows NT 6.1; WOW64; rv:31.0) Gecko/20100101 Firefox/31.0',
		'Accept: text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
		'Accept-Language: en-US,en;q=0.5',
		'Connection: keep-alive',
	);

	$ch = curl_init();
	if ($ch === false) {
		return false;
	}

	curl_setopt($ch, CURLOPT_URL, $url);
	// No hand-written Host header: cURL derives it from the URL, which also
	// stays correct when a redirect is followed.
	curl_setopt($ch, CURLOPT_HTTPHEADER, $headers);
	// Let cURL negotiate compression AND decode the body; a hand-written
	// Accept-Encoding header would hand back raw gzip bytes.
	curl_setopt($ch, CURLOPT_ENCODING, '');
	// Empty string switches on the in-memory cookie engine without touching disk.
	curl_setopt($ch, CURLOPT_COOKIEFILE, '');
	curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
	curl_setopt($ch, CURLOPT_FOLLOWLOCATION, 1);

	$text = curl_exec($ch);
	if ($text === false) {
		curl_close($ch);
		return false;
	}

	// Single-quoted patterns so the embedded double quotes need no escaping;
	// [^"]* stops at the closing quote of the value attribute.
	$viewstate       = regexExtract($text, '/__VIEWSTATE" value="([^"]*)"/i', 1);
	$EVENTVALIDATION = regexExtract($text, '/__EVENTVALIDATION" value="([^"]*)"/i', 1);

	$postFields = array(
		'__EVENTTARGET'     => 'ctl00$Content$gvForeclosures',
		'__EVENTARGUMENT'   => 'Page$' . $page,
		'__VIEWSTATE'       => $viewstate,
		'__SCROLLPOSITIONX' => 0,
		'__SCROLLPOSITIONY' => '',
		'__EVENTVALIDATION' => $EVENTVALIDATION,
	);

	curl_setopt($ch, CURLOPT_HTTPHEADER, array_merge($headers, array(
		'Referer: http://www.kanesheriff.com/civilDivision/foreclosures.aspx',
	)));
	curl_setopt($ch, CURLOPT_POST, 1);
	curl_setopt($ch, CURLOPT_POSTFIELDS, http_build_query($postFields));

	$result = curl_exec($ch);
	curl_close($ch);

	return $result;
}

$url  = 'URL';//putting on Site url link

// Number of pager links to print (and the highest page accepted from the query string).
$totalPages = 28;

// Accept ?page=N only when N is an integer between 1 and $totalPages;
// anything else falls back to the plain first-page download.
$page = null;
if (isset($_GET['page'])) {
	$page = filter_var($_GET['page'], FILTER_VALIDATE_INT, array(
		'options' => array('min_range' => 1, 'max_range' => $totalPages),
	));
	if ($page === false) {
		$page = null;
	}
}

if ($page !== null) {
	// Paged request: the selector already restricts the match to the grid's data rows.
	$result = foreclosureFetchPage($url, $page);
	$data   = foreclosureRows($result, 'table[id=ctl00_Content_gvForeclosures] > tr[style=color:Black;],tr[style=color:Black;background-color:#FFF6D2;] ');
} else {
	$result = file_get_contents($url);
	$data   = foreclosureRows($result, 'table > tr ');

	// 'table > tr ' matches every row, so drop the non-data ones by position.
	// NOTE(review): presumably row 0 is the header and rows 21-22 are pager rows — confirm against the live page.
	unset($data[0]);
	unset($data[21]);
	unset($data[22]);
}

// NOTE(review): the table markup below is reconstructed — the original tags were
// lost and only the header text and the order of the echoed fields survived.
// The original only rendered output for the first page; rendering is now shared
// so the pager's ?page=N links show their results too.
if (!empty($data)) {
	echo '<table>';
	echo '<tr><th>Sales Date</th><th>State</th><th>Case No</th><th>Sheriff</th><th>Address</th><th>Judgment Amt</th></tr>';

	foreach ($data as $key => $val) {
		echo '<tr>';
		// double_encode = false: entities already present in the scraped text are kept as-is.
		echo '<td>' . htmlspecialchars($val['sales_date'], ENT_QUOTES | ENT_SUBSTITUTE, 'UTF-8', false) . '</td>';
		echo '<td>IL</td>'; // state column is a fixed literal
		echo '<td>' . htmlspecialchars($val['case_number'], ENT_QUOTES | ENT_SUBSTITUTE, 'UTF-8', false) . '</td>';
		echo '<td>' . htmlspecialchars($val['Sheriff'], ENT_QUOTES | ENT_SUBSTITUTE, 'UTF-8', false) . '</td>';
		echo '<td>' . htmlspecialchars($val['address'], ENT_QUOTES | ENT_SUBSTITUTE, 'UTF-8', false) . '</td>';
		echo '<td>' . htmlspecialchars($val['jud_amt'], ENT_QUOTES | ENT_SUBSTITUTE, 'UTF-8', false) . '</td>';
		echo '</tr>';
	}

	echo '</table>';

	// Pager: page 1 links to the bare script, every other page adds ?page=N.
	$link_data = '<div>';
	for ($i = 1; $i <= $totalPages; $i++) {
		if ($i == 1) {
			$querystring = '';
		} else {
			$querystring = '?page=' . $i;
		}
		$link_data .= '<span style="padding-right:10px;"><a href="civilDivision.php' . $querystring . '">' . $i . '</a></span>';
	}
	$link_data .= '</div>';
	echo $link_data;
}