PATH:
home
/
lab2454c
/
keebchat.com
/
core
/
libs
/
htmlParser
/
example
/
scraping
<?php include_once('../../simple_html_dom.php'); function scraping_IMDB($url) { // create HTML DOM $html = file_get_html($url); // get title $ret['Title'] = $html->find('title', 0)->innertext; // get rating $ret['Rating'] = $html->find('div[class="general rating"] b', 0)->innertext; // get overview foreach($html->find('div[class="info"]') as $div) { // skip user comments if($div->find('h5', 0)->innertext=='User Comments:') return $ret; $key = ''; $val = ''; foreach($div->find('*') as $node) { if ($node->tag=='h5') $key = $node->plaintext; if ($node->tag=='a' && $node->plaintext!='more') $val .= trim(str_replace("\n", '', $node->plaintext)); if ($node->tag=='text') $val .= trim(str_replace("\n", '', $node->plaintext)); } $ret[$key] = $val; } // clean up memory $html->clear(); unset($html); return $ret; } // ----------------------------------------------------------------------------- // test it! $ret = scraping_IMDB('http://imdb.com/title/tt0335266/'); foreach($ret as $k=>$v) echo '<strong>'.$k.' </strong>'.$v.'<br>'; ?>
[-] example_scraping_general.php
[edit]
[-] example_scraping_imdb.php
[edit]
[-] example_scraping_digg.php
[edit]
[+]
..
[-] example_scraping_slashdot.php
[edit]