<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
 
<html xmlns="http://www.w3.org/1999/xhtml">
 
    <head>
 
<meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
 
<title>Scraper demo</title>
 
</head>
 
<body>    
 
<?php 
 
 
include 'scraper.php';
 
 
/*
 
 * Examples
 
 */
 
 
 
/* comment this line with // to enable example section 
 
 // Example 1
 
 // Scan single page and grab data
 
try 
 
{   
 
    $scrap = new Scraper();
 
    
 
    //set url to scan
 
    $scrap->setBaseUrl('test.html');
 
    
 
    //definition of points where data are 
 
    $scrap->addDataTarget('title', '#product h1');
 
    $scrap->addDataTarget('category', '#product #category');
 
    $scrap->addDataTarget('description', '#product #description');
 
    $scrap->addDataTarget('price', '#product #price');
 
    
 
    //run scan
 
    $data = $scrap->process();
 
    
 
    //show results
 
    var_dump($data);
 
 
}
 
catch (Exception $e)
 
{
 
    echo $e->getMessage();
 
}
 
//*/
 
 
 
///* comment this line with // to enable example section
 
 // Example 2
 
 // Scan base url with range id's
 
   
 
try 
 
{   
 
    $scrap = new Scraper();
 
    
 
    //set base url with token named ##TOKEN##
 
    $scrap->setBaseUrl('http://szukaj.pl.mobile.eu/pojazdy/details.html?id=##TOKEN##');
 
    
 
    //Set the scan range for the token
 
    $scrap->addRangeScanRule(151598039, 151598042, '##TOKEN##');
 
    
 
    //definition of points where data are 
 
    $scrap->addDataTarget('name', '.headline .margin h1');
 
    $scrap->addDataTarget('price', '#buyerpricegross');
 
    $scrap->addDataTarget('image', '#imageWrapper #thumbnailoverlay a');
 
    
 
    
 
    //run
 
    $data = $scrap->process();
 
    
 
    //output
 
    foreach ($data as $row)
 
    {
 
        echo "<strong>Name:</strong> " . $row['name'] . "<br />";
 
        echo "<strong>Price:</strong> " . $row['price'] . "<br />";
 
        echo $row['image'] . "<br />";
 
        echo "<br /> <hr /><br />";        
 
    }
 
    //var_dump($data);
 
 
}
 
catch (Exception $e)
 
{
 
    echo $e->getMessage();
 
}
 
 
//*/
 
 
 
 
 
/* comment this line with // to enable example section
 
 // Example 3
 
 // Scan list of urls
 
try 
 
{
 
    $scrap = new Scraper();
 
    
 
    //define urls to scan
 
    $myUrls = array(
 
        'http://wlasnorecznie.boo.pl/wlasnorecznie/content/ciasteczka',
 
        'http://wlasnorecznie.boo.pl/wlasnorecznie/content/ziarenka-kawy',
 
        'http://wlasnorecznie.boo.pl/wlasnorecznie/content/pacman-3d'
 
    );
 
    
 
    //add urls to scraper
 
    $scrap->addListScanRule($myUrls);
 
    
 
    //define data points
 
    $scrap->addDataTarget('title', '#content .ogloszenie_item h1');
 
    $scrap->addDataTarget('image', '#content .ogloszenie_thumb a');
 
    $scrap->addDataTarget('price', '#content .ogloszenie_item:contains(\'Cena:\')');
 
    
 
    //start
 
    $data = $scrap->process();
 
    
 
    //show results
 
    var_dump($data);
 
}
 
catch (Exception $e)
 
{
 
    echo $e->getMessage();
 
}
 
//*/
 
 
 
?>
 
</body></html>
 
 |