This article collects typical usage examples of the PHP simple_html_dom class: what the class is for, how it is used, and what real-world code built on it looks like.
The 20 code examples below are drawn from open-source projects and are ordered by popularity.
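Before the individual examples, here is a minimal sketch of the pattern most of them share: load an HTML string into a simple_html_dom object, query elements with CSS-style selectors through find(), read attributes or plaintext, and free the parser with clear(). The include path, URL and selector below are placeholders, not taken from any of the projects.
// Minimal usage sketch; include path, URL and selector are placeholders.
include_once 'simple_html_dom.php';
$html = file_get_contents('http://example.com/');
$dom = new simple_html_dom();
$dom->load($html);                       // parse the markup
foreach ($dom->find('a') as $link) {     // CSS-style selector
    echo $link->href . ' => ' . $link->plaintext . PHP_EOL;
}
$dom->clear();                           // free the memory held by the parser
unset($dom);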
Example 1: handleDocumentInfo
function handleDocumentInfo($DocInfo)
{
echo "Page requested: " . $DocInfo->url . " (" . $DocInfo->http_status_code . ")" . PHP_EOL;
if ($DocInfo->http_status_code == '200' and $DocInfo->received and $DocInfo->content_type == 'text/html' and isset($DocInfo->content)) {
$html = $DocInfo->content;
$host = $DocInfo->host;
$urlPosted = $DocInfo->url;
$htmldom = new simple_html_dom();
$htmldom->load($html);
$data = array();
$images = $htmldom->find('ul#ListViewInner li img');
echo 'Total images: ' . count($images) . PHP_EOL;
$i = 0;
foreach ($images as $raw_links) {
echo $raw_links->alt . "','1','" . $raw_links->src . "\n";
$filename = '_e__' . $i . '.jpg';
copy(str_replace("l225 ", "l900", $raw_links->src), 'downloads/' . $filename);
$i++;
}
echo json_encode($data) . PHP_EOL;
//$writer->writeRow(json_encode($data));
unset($data);
unset($htmldom);
}
}
Author: natzar, Project: Robin, Lines of code: 25, Source file: ebayClass.php
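Examples 1 and 14 look like overrides of handleDocumentInfo(), the per-page callback used by the PHPCrawl library. The following sketch shows how such a callback is typically hooked up; the class name, include path and start URL are assumptions, not taken from the original project.
// Sketch only: assumes the PHPCrawl library layout and API.
require_once 'libs/PHPCrawler.class.php';             // assumed include path

class ImageCrawler extends PHPCrawler
{
    public function handleDocumentInfo(PHPCrawlerDocumentInfo $DocInfo)
    {
        // ... parse $DocInfo->content with simple_html_dom as in Example 1 ...
    }
}

$crawler = new ImageCrawler();
$crawler->setURL('http://www.example.com/');           // placeholder start URL
$crawler->addContentTypeReceiveRule('#text/html#');    // only download HTML pages
$crawler->go();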
Example 2: parse
public function parse($isUpdate = false)
{
Ibos::import("application.extensions.simple_html_dom", true);
if ($isUpdate) {
$model = preg_replace("/\\s+data-id\\s?=\\s?\"?\\d+\"?/i", "", $this->printmodel);
$max = 0;
} else {
$model = $this->printmodel;
$max = intval($this->itemmax);
}
$elements = array();
$doc = new simple_html_dom();
$doc->load($model, true, true, CHARSET);
$items = $doc->find("ic");
$config = $this->getItemConfig();
if (!empty($items) && !empty($config)) {
$this->refactor($items, $config, $max, $elements);
}
$html = $doc->save();
$this->_cache = $elements;
CacheUtil::set("form_" . $this->ID, $elements);
$form["printmodelshort"] = $html;
if ($max != $this->itemmax) {
$form["itemmax"] = $max;
}
$doc->clear();
FlowFormType::model()->modify($this->ID, $form);
}
Author: AxelPanda, Project: ibos, Lines of code: 28, Source file: SimpleHtmlParser.php
Example 3: run_ml
function run_ml($q_num = 0)
{
$html = scraperWiki::scrape("http://musiklegal.com/search/result/a/" . $q_num);
$dom = new simple_html_dom();
$dom->load($html);
foreach ($dom->find("tr") as $data) {
$tds = $data->find("td");
$temp_data = explode('">', str_replace('</a>', '', str_replace('<a href="http://musiklegal.com/song/detail/', '', $tds[1]->plaintext)));
$record = array('No' => str_replace('.', '', $tds[0]->plaintext), 'Code' => $temp_data[0], 'Song Title' => $temp_data[1], 'Artist' => $tds[2]->plaintext, 'Album' => $tds[3]->plaintext);
/*
* Stores results
*/
scraperwiki::save_sqlite(array("No"), $record);
unset($temp_data);
}
$tmp_a = 0;
foreach ($dom->find("a") as $a) {
if ($a->plaintext == 'Next') {
$tmp_a = $a->href;
$tmp_a = str_replace('http://musiklegal.com/search/result/a/', '', $tmp_a);
if ($tmp_a > 0) {
continue;
}
}
}
if ((int) $tmp_a != 0) {
run_ml($tmp_a);
} else {
exit;
}
}
Author: flyeven, Project: scraperwiki-scraper-vault, Lines of code: 30, Source file: other_scraper_ml.php
Example 4: getMoviesUrl
/**
* Get the video URLs
*
* @param simple_html_dom $html
* @return array
**/
public function getMoviesUrl($html)
{
$query = 'div.entryBody div.topmore a img';
$movies_els = $html->find($query);
$movie_data = array();
$manager = new UriManager();
// Get the links whose alt text starts with 動画 ("video is here")
foreach ($movies_els as $movies_el) {
if (!preg_match('/^動画.+/', $movies_el->getAttribute('alt'))) {
continue;
}
// Get the link from the parent a tag
$parent_el = $next_el = $movies_el->parentNode();
$i = 0;
while ($i < 3) {
$next_el = $next_el->nextSibling();
if (is_null($next_el)) {
break;
}
$i++;
}
if ($next_el->nodeName() == 'span') {
$movie_data = [];
break;
}
if ($parent_el->nodeName() == 'a') {
$movie_data[] = $manager->resolve($parent_el->getAttribute('href'));
}
}
return $movie_data;
}
Author: kknet, Project: AdultMidnight, Lines of code: 37, Source file: Ichizen.php
Example 5: getProducts
function getProducts($u, $cat)
{
global $o;
$d = new simple_html_dom();
$d->load(scraperwiki::scrape($u));
//echo "Loaded URL: " . $u . "\n";
$items = $d->find('li.grid-item');
if (count($items) > 0) {
foreach ($items as $p) {
$prod = $p->find('p.product-name > a', 0);
$prodname = trim($prod->innertext);
$prodURL = $prod->href;
if (!is_null($p->find('p.minimal-price', 0))) {
$prodtype = 1;
} else {
$prodtype = 0;
}
fputcsv($o, array($prodname, $prodtype, $cat, $prodURL));
echo $prodname . "\n";
}
if (!is_null($d->find('p.next', 0))) {
getProducts($d->find('p.next', 0)->href, $cat);
}
}
}
Author: jbm160, Project: brs, Lines of code: 25, Source file: productlist.php
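Example 5 writes each product row to a CSV handle held in the global $o and follows pagination through the p.next link; a minimal way to drive it might look like the following (the output file name, start URL and category label are assumptions).
// Sketch only: open the CSV handle that getProducts() uses via "global $o".
$o = fopen('products.csv', 'w');                                        // assumed output file
getProducts('http://www.example-shop.com/category.html', 'Category');   // placeholder URL and category
fclose($o);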
Example 6: get_data
/**
* Fetch the lottery draw data over HTTP
*/
private function get_data()
{
include_once 'simplehtmldom_1_5/simple_html_dom.php';
$simple_html_dom = new \simple_html_dom();
// decompress with zlib and convert the encoding
$data = false;
$data = @file_get_contents("compress.zlib://" . self::URL);
if (!$data) {
$this->setLog(false, '重庆时时彩-开奖数据抓取失败');
exit('重庆时时彩-数据抓取失败,请尽快联系网站管理员' . "\r\n");
}
// convert to UTF-8
$encode = mb_detect_encoding($data, array('ASCII', 'UTF-8', 'GB2312', "GBK", 'BIG5'));
$content = iconv($encode, 'UTF-8', $data);
$simple_html_dom->load($content);
// draw issue number
$qihao = $simple_html_dom->find('div[class=aside]', 0)->find('h3', 0)->find('em', 0)->plaintext;
// winning numbers
$code = $simple_html_dom->find('div[class=aside]', 0)->find('div[class=mod-aside mod-aside-xssckj]', 0)->find('div[class=bd]', 0)->find('div[class=kpkjcode]', 0)->find('table', 0)->find('tr', 1)->find('td', 1)->plaintext;
if ($code == '--') {
exit('重庆时时彩-等待开奖...' . "\r\n");
}
$isKaiJiang = $simple_html_dom->find('div[class=aside]', 0)->find('div[class=mod-aside mod-aside-xssckj]', 0)->find('div[class=bd]', 0)->find('div[class=kpkjcode]', 0)->find('table', 0)->find('tr', 1)->find('td', 2)->plaintext;
if ($isKaiJiang == '--' || $isKaiJiang == '开奖中') {
exit('重庆时时彩-等待开奖...' . "\r\n");
}
$simple_html_dom->clear();
// remove the spaces inside the winning number string
$code = str_replace(" ", '', $code);
// draw time
$kjsj = date('Y-m-d H:i:s');
$this->data = ['qihao' => $qihao, 'kjsj' => $kjsj, 'code' => $code];
}
Author: aiyeyun, Project: grab, Lines of code: 36, Source file: GrabCqSsc.php
Example 7: getMoviesUrl
/**
* Get the video URLs
*
* @param simple_html_dom $html
* @return array
**/
public function getMoviesUrl($html)
{
$query = 'div.ently_body div.ently_text div.video-container iframe';
$movies_els = $html->find($query);
$movie_data = array();
$manager = new UriManager();
// Get the link for the 動画はこちら ("video is here") text
foreach ($movies_els as $movies_el) {
if ($movies_el->hasAttribute('src')) {
$url = $manager->resolve($movies_el->getAttribute('src'));
if ($url !== false) {
$movie_data[] = $url;
}
}
}
$query = 'div.ently_outline div.ently_body a';
$movies_els = $html->find($query);
foreach ($movies_els as $movies_el) {
$text = $movies_el->plaintext;
if (preg_match('/リンク\(/', $text) && $movies_el->hasAttribute('href')) {
$resolve_url = $manager->resolve($movies_el->getAttribute('href'));
if ($resolve_url) {
$movie_data[] = $resolve_url;
}
}
}
return $movie_data;
}
Author: kknet, Project: AdultMidnight, Lines of code: 34, Source file: EroEro.php
Example 8: do_day
function do_day($rec)
{
$html = scraperwiki::scrape($rec['url']);
$dom = new simple_html_dom();
$dom->load($html);
$cell = $dom->find('a[name=discs]');
$lines = $cell[0]->parent->find('text');
print $lines[10] . "\n";
print count($lines) . "\n";
# loop by number, as null lines stop a foreach
$n = 0;
for ($line_no = 0; $line_no < count($lines); $line_no++) {
$line = $lines[$line_no];
if (strlen($line) == 3) {
# the DOM object crashes on this row, so ignore
continue;
}
#if (preg_match("#^" . $n . "#", $line, $matches)) {
print $line_no . " " . strlen($line) . "\n";
$n = $n + 1;
print $line . "\n";
#}
}
#scraperwiki::save(array('data'), array('data' => $data->plaintext));
}
Author: flyeven, Project: scraperwiki-scraper-vault, Lines of code: 25, Source file: desert-island-disc-records.php
Example 9: compile
/**
* Compile a template file by reading it, converting the DOM using
* {@see convert()}, then applying macros using {@see transform()}.
* @param string $template Template file path.
* @return string PHP template content.
* @throws InvalidTemplateException If template is inaccessible or invalid.
*/
public function compile($template)
{
$dom = new \simple_html_dom();
$this->currentTemplate = $template;
$file = file_get_contents($template);
if ($file === false) {
throw new InvalidTemplateException(tr('Could not read template: %1', $template));
}
if (!$dom->load($file, true, false)) {
throw new InvalidTemplateException(tr('Could not parse template: %1', $template));
}
$root = new InternalNode();
$main = $dom->find('[j:main]', 0);
if (isset($main)) {
$root->append($this->convert($main));
} else {
foreach ($dom->find('*, text') as $html) {
if ($html->parent->tag != 'root') {
continue;
}
$root->append($this->convert($html));
}
}
$this->transform($root);
return $root->__toString();
}
Author: jivoo, Project: jivoo, Lines of code: 33, Source file: TemplateCompiler.php
Example 10: scrapPage
function scrapPage($page)
{
print "Scraping page " . $page;
$url = "http://www.geipan.fr/index.php?id=202";
$fields_string = "&no_cache=1&" . "tx_geipansearch_pi1%5Bsubmit_form%5D=1&" . "tx_geipansearch_pi1%5Btexte_resume%5D=&" . "tx_geipansearch_pi1%5Bdate_debut%5D=&" . "tx_geipansearch_pi1%5Bdate_fin%5D=&" . "no_cache=1&" . "tx_geipansearch_pi1%5Bclasse_cas%5D=tous&" . "tx_geipansearch_pi1%5Bregion%5D=&" . "page=" . $page . "&" . "order_by=&" . "sens=";
$curl = curl_init($url);
curl_setopt($curl, CURLOPT_RETURNTRANSFER, true);
curl_setopt($curl, CURLOPT_FOLLOWLOCATION, true);
curl_setopt($curl, CURLOPT_MAXREDIRS, 10);
curl_setopt($curl, CURLOPT_SSL_VERIFYPEER, false);
curl_setopt($curl, CURLOPT_TIMEOUT, 20);
curl_setopt($curl, CURLOPT_POST, 11);
curl_setopt($curl, CURLOPT_POSTFIELDS, $fields_string);
$html = curl_exec($curl);
print curl_error($curl) . "\n";
// print($html);
$dom = new simple_html_dom();
$dom->load($html);
$trs = $dom->find("tr");
foreach ($trs as $tr) {
if (isset($tr->attr['onclick'])) {
$ID = substr($tr->attr['onclick'], strpos($tr->attr['onclick'], "cas=") + 4, 13);
print $ID . "\n";
$tds = $tr->find("td");
$title = utf8_encode($tds[0]->plaintext);
$date = $tds[1]->plaintext;
$departement = utf8_encode($tds[2]->plaintext);
$classe = $tds[3]->plaintext;
$maj = $tds[4]->plaintext;
$city = substr($title, 0, strpos($title, "(") - 1);
$record = array('ID' => $ID, 'title' => $title, 'date' => $date, 'departement' => $departement, 'classe' => $classe, 'maj' => $maj, 'city' => $city);
scraperwiki::save(array('ID', 'maj'), $record);
}
}
}
Author: flyeven, Project: scraperwiki-scraper-vault, Lines of code: 35, Source file: geipan.php
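Example 10 posts the GEIPAN search form and saves every case row of one result page per call, so it is normally driven by a small loop over page numbers; a sketch (the page range is an assumption):
// Sketch only: iterate over result pages; 20 is an assumed upper bound.
for ($page = 1; $page <= 20; $page++) {
    scrapPage($page);
}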
Example 11: getSearchResults
public function getSearchResults(simple_html_dom $dom)
{
$result = array();
$count = count($dom->find('div.srg'));
if ($count) {
// if found div.srg
$c = $count > 1 ? 1 : 0;
// on the first results page there are two div.srg blocks; the first one
// holds irrelevant links, so skip it and use the second
$d = $dom->find('div.srg', $c);
// get second div(if this is 1st page), or first div
} else {
// no div.srg found, search all page
$d = $dom;
}
foreach ($d->find('div.rc') as $div) {
$a = $div->find('h3.r a', 0);
// get link to the website
//Get original image url
$originalImg = $div->find('div.th a', 0);
preg_match('/imgurl=(.+?)&/', $originalImg->href, $matches);
$result[] = array(htmlspecialchars_decode($a->plaintext, ENT_QUOTES), $a->href, $matches[1]);
}
return $result;
}
Author: gigikiri, Project: GoogleImageSearch, Lines of code: 25, Source file: GoogleImageSearch.php
Example 12: scrape_page
function scrape_page()
{
$row = 0;
$html = scraperWiki::scrape("http://asuntojen.hintatiedot.fi/haku/?c=" . $GLOBALS['c'] . "&s=" . $GLOBALS['s'] . "&r=" . $GLOBALS['r'] . "&amin=" . $GLOBALS['amin'] . "&amax=" . $GLOBALS['amax'] . "&z=" . $GLOBALS['z']);
$dom = new simple_html_dom();
$dom->load($html);
foreach ($dom->find("tr") as $data) {
$tds = $data->find("td");
if (count($tds) > 8) {
$row++;
$GLOBALS['rowTotal']++;
$apt = array("Uniikkiavain" => $GLOBALS['rowTotal'], "Kaupunginosa" => $tds[0]->plaintext, "Myyntihinta" => $tds[3]->plaintext, "Neliohinta" => $tds[4]->plaintext, "Tyyppi" => $tds[1]->plaintext, "Koko" => $tds[2]->plaintext);
scraperwiki::save_sqlite(null, $apt, $table_name = $GLOBALS['c'] . " " . $GLOBALS['time']);
print $GLOBALS['rowTotal'] . "\n";
print $row . ". Sijainti: " . $tds[0]->plaintext . " Hinta: " . $tds[3]->plaintext . " Tyyppi: " . $tds[1]->plaintext . " Koko: " . $tds[2]->plaintext . " Neliöhinta: " . $tds[4]->plaintext . "€" . "\n";
}
}
if ($row == 50) {
print "Vielä jatkuu, haetaan seuraava sivu..." . "\n";
$GLOBALS['z']++;
scrape_page();
} else {
print "Skrääpiminen suoritettu." . "\n";
print "Sivuja yhteensä: " . $GLOBALS['z'] . "\n";
print "Rivejä yhteensä: " . $GLOBALS['rowTotal'] . "\n";
}
}
Author: flyeven, Project: scraperwiki-scraper-vault, Lines of code: 27, Source file: asuntojen_hintatiedot_1.php
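Example 12 reads all of its search parameters and counters from $GLOBALS and pages through the results by incrementing z before calling itself again; the setup it appears to expect could look like this (all parameter values below are assumptions):
// Sketch only: define the globals scrape_page() reads before the first call.
$GLOBALS['c'] = 'Helsinki';        // city (assumed value)
$GLOBALS['s'] = '';                // remaining search filters, assumed empty
$GLOBALS['r'] = '';
$GLOBALS['amin'] = '';
$GLOBALS['amax'] = '';
$GLOBALS['z'] = 1;                 // result page counter, incremented inside scrape_page()
$GLOBALS['rowTotal'] = 0;          // running row counter
$GLOBALS['time'] = date('Y-m-d');  // used in the sqlite table name (assumed format)
scrape_page();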
Example 13: save
public function save($html, $dir)
{
import("@.ORG.htmltodocx.documentation.support_functions");
$phpword_object = new PHPWord();
$section = $phpword_object->createSection();
// HTML Dom object:
$html_dom = new simple_html_dom();
$html_dom->load('<html><body>' . $html . '</body></html>');
// Note, we needed to nest the html in a couple of dummy elements.
// Create the dom array of elements which we are going to work on:
$html_dom_array = $html_dom->find('html', 0)->children();
// We need this for setting base_root and base_path in the initial_state array
// (below). We are using a function here (derived from Drupal) to create these
// paths automatically - you may want to do something different in your
// implementation. This function is in the included file
// documentation/support_functions.inc.
$paths = htmltodocx_paths();
// Provide some initial settings:
$initial_state = array('phpword_object' => &$phpword_object, 'base_root' => $paths['base_root'], 'base_path' => $paths['base_path'], 'current_style' => array('size' => '11'), 'parents' => array(0 => 'body'), 'list_depth' => 0, 'context' => 'section', 'pseudo_list' => TRUE, 'pseudo_list_indicator_font_name' => 'Wingdings', 'pseudo_list_indicator_font_size' => '7', 'pseudo_list_indicator_character' => 'l ', 'table_allowed' => TRUE, 'treat_div_as_paragraph' => TRUE, 'style_sheet' => htmltodocx_styles_example());
// Convert the HTML and put it into the PHPWord object
htmltodocx_insert_html($section, $html_dom_array[0]->nodes, $initial_state);
// Clear the HTML dom object:
$html_dom->clear();
unset($html_dom);
// Save File
$h2d_file_uri = $dir . "wordtemp/" . time() . ".docx";
if (!file_exists($dir . "wordtemp/")) {
$this->createFolders($dir . "wordtemp/");
// make sure the target folder exists
}
$objWriter = PHPWord_IOFactory::createWriter($phpword_object, 'Word2007');
$objWriter->save($h2d_file_uri);
return $h2d_file_uri;
}
Author: tmlsoft, Project: main, Lines of code: 35, Source file: HtmlToDocx.php
Example 14: handleDocumentInfo
function handleDocumentInfo($DocInfo)
{
// global $writer;
echo "Page requested: " . $DocInfo->url . " (" . $DocInfo->http_status_code . ")" . PHP_EOL;
if ($DocInfo->http_status_code == '200' and $DocInfo->received and $DocInfo->content_type == 'text/html' and isset($DocInfo->content)) {
$html = $DocInfo->content;
$host = $DocInfo->host;
$urlPosted = $DocInfo->url;
$htmldom = new simple_html_dom();
$htmldom->load($html);
$data = array();
$images = $htmldom->find('.pinHolder img');
echo 'Total Images ' . count($images) . PHP_EOL;
$i = intval(Date("YmdHis"));
foreach ($images as $raw_links) {
$data['items'][] = array("title" => $raw_links->alt, "img" => $raw_links->src);
copy($raw_links->src, 'downloads/' . $i . '.jpg');
$i++;
}
echo json_encode($data) . PHP_EOL;
//$writer->writeRow(json_encode($data));
unset($data);
unset($htmldom);
}
}
Author: natzar, Project: Robin, Lines of code: 25, Source file: pinterestClass.php
Example 15: parsing
private function parsing($scrappedData)
{
$result = [];
//Create a DOM parser object
$html = new simple_html_dom();
//Parse the HTML from Amazon.
$html->load($scrappedData);
# Iterate over all the tags
foreach ($html->find('li[class=s-result-item]') as $key => $innerData) {
//image
foreach ($innerData->find('img[class=s-access-image]') as $img) {
$atmp['image'] = $img->getAttribute('src');
}
//title
foreach ($innerData->find('h2[class=s-access-title]') as $title) {
$atmp['title'] = $title->innertext();
}
//price
foreach ($innerData->find('span[class=s-price]') as $price) {
$price = $price->innertext();
$atmp['price'] = $price;
$atmp['numPrice'] = str_replace(",", '', substr($price, 1));
}
//total page
foreach ($html->find('span[class=pagnDisabled]') as $maxPage) {
$atmp['totalPage'] = $maxPage->innertext();
}
# Show the <a href>
if (isset($atmp)) {
$result[$key] = $atmp;
}
}
return $this->aResult = $result;
}
Author: rahulpr, Project: Scrap-amazon, Lines of code: 34, Source file: scrap_amazon.php
Example 16: scrapeTEDRSS
function scrapeTEDRSS($url, $sector)
{
print $url . " " . $sector . "\n";
// $xml = scraperWiki::scrape($url);
$curl = curl_init($url);
curl_setopt($curl, CURLOPT_RETURNTRANSFER, true);
curl_setopt($curl, CURLOPT_FOLLOWLOCATION, true);
curl_setopt($curl, CURLOPT_MAXREDIRS, 10);
curl_setopt($curl, CURLOPT_SSL_VERIFYPEER, false);
curl_setopt($curl, CURLOPT_TIMEOUT, 20);
// abort the request after 20 seconds
// try CURLOPT_CONNECTTIMEOUT (in seconds)
// try CURLOPT_LOW_SPEED_LIMIT (to define what slow is, with):
// curl_setopt($curl, CURLOPT_LOW_SPEED_TIME, 10); (10 second at low speed before aborting
$xml = curl_exec($curl);
print curl_error($curl) . "\n";
$dom = new simple_html_dom();
$dom->load($xml);
$items = $dom->find("item");
foreach ($items as $item) {
$guid = $item->find("guid");
$noticeURL = str_replace("TEXT", "DATA", $guid[0]->plaintext);
print $noticeURL . " " . $sector . " " . memory_get_usage() / 1000000 . "MB";
echo "\n";
// $record = scrapeTEDDataPage ($noticeURL, $sector);
$record = array('time' => microtime(true), 'sector' => $sector, 'url' => $noticeURL);
scraperwiki::save(array('sector', 'url'), $record);
sleep(1);
}
$dom->__destruct();
unset($items);
unset($dom);
unset($xml);
print memory_get_usage() / 1024 / 1024 . "MB\n";
}
Author: flyeven, Project: scraperwiki-scraper-vault, Lines of code: 35, Source file: dk-ted.php
Example 17: parsing
protected function parsing($input)
{
include_once "inc/simple_html_dom.php";
# Create a DOM parser object
$html = new simple_html_dom();
# Parse the HTML from Amazon.
$html->load($input);
$result = [];
# Iterate over all the tags
foreach ($html->find('li[class=s-result-item]') as $key => $innerData) {
//image
foreach ($innerData->find('img[class=s-access-image]') as $img) {
$atmp['image'] = $img->getAttribute('src');
}
//title
foreach ($innerData->find('h2[class=s-access-title]') as $title) {
$atmp['title'] = $title->innertext();
}
//price
foreach ($innerData->find('span[class=s-price]') as $price) {
$price = $price->innertext();
$atmp['price'] = $price;
$atmp['numPrice'] = str_replace(",", '', substr($price, 1));
}
# Show the <a href>
$result[$key] = $atmp;
}
if (!empty($result)) {
return $this->aResult = $result;
}
}
Author: kavyavsagar, Project: Scrap-Amazon, Lines of code: 31, Source file: search.php
Example 18: grep_munich
function grep_munich($url, $table_name)
{
$html = scraperWiki::scrape($url);
$count = 0;
# Use the PHP Simple HTML DOM Parser to extract <td> tags
$dom = new simple_html_dom();
$dom->load($html);
//Drop all old information by dropping the table
scraperwiki::sqliteexecute("drop table if exists " . $table_name);
scraperwiki::sqlitecommit();
$table = $dom->getElementById('flight_info_area');
foreach ($table->find('tr') as $data) {
// Flight details. Read tds or ths
$tds = $data->find("td");
//if there are less then 7 columns continue to next loop
if (sizeof($tds) < 7) {
continue;
}
//print $data->plaintext . "\n";
$flightnr = $tds[1]->plaintext;
$from = $tds[2]->plaintext;
$time = $tds[3]->plaintext;
$expected_time = $tds[4]->plaintext;
//Create date
$date = date("Y-m-d");
//Build array of flight informations
$flight_data = array("date" => $date, "count" => $count, "flightnr" => $flightnr, "from" => $from, "time" => $time, "expected_time" => $expected_time);
//Save the informations of one flight
scraperwiki::save_sqlite(array("date", "count"), $flight_data, $table_name);
$count = $count + 1;
}
}
Author: flyeven, Project: scraperwiki-scraper-vault, Lines of code: 32, Source file: munich_airport.php
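Example 18 expects the flight-information page of the Munich airport site and a target table name; a call might look like the following (the URL is a placeholder, not the real page address):
// Sketch only: the URL below is a placeholder for the airport's flight info page.
grep_munich('http://www.munich-airport.example/arrivals.html', 'arrivals');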
Example 19: scrapeHTML
function scrapeHTML($param, $type)
{
$html = scraperWiki::scrape("http://www.norwegian.no/fly/lavpris/?D_City=CPH&A_City=DUB&TripType=2&D_Day=1&D_Month=201104&R_Day=1&R_Month=201104&AdultCount=1&ChildCount=0&InfantCount=0");
$dom = new simple_html_dom();
$dom->load($html);
// Iterate over table rows and get flight details.
foreach ($dom->find("TR[@HEIGHT='25']") as $data) {
// Flight details.
$tds = $data->find("div");
$airline = removeSpaces($tds[0]->plaintext);
$flight_type = $type;
$flight_num = removeSpaces($tds[1]->plaintext);
$destination = removeSpaces($tds[2]->plaintext);
$time = removeSpaces($tds[3]->plaintext);
$gate = removeSpaces($tds[4]->plaintext);
$remarks = removeSpaces($tds[5]->plaintext);
// Skip header row. Cheesy, but effective.
if ($airline == "Airline") {
continue;
}
// Set the date.
$date = date("m.d.y");
// Build up record to store.
$flight_data = array("date" => $date, "airline" => $airline, "flight_type" => $flight_type, "flight_num" => $flight_num, "destination" => $destination, "time" => $time, "gate" => $gate, "remarks" => $remarks);
// Save the record.
saveData(array("date", "airline", "flight_type", "flight_num"), $flight_data);
}
$dom->clear();
}
Author: flyeven, Project: scraperwiki-scraper-vault, Lines of code: 29, Source file: phl-flight-scraperphp.php
Example 20: get_dom
function get_dom($url)
{
$html = scraperWiki::scrape($url);
$dom = new simple_html_dom();
$dom->load($html);
return $dom;
}
Author: flyeven, Project: scraperwiki-scraper-vault, Lines of code: 7, Source file: testing_scraper.php
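Example 20 is a small helper that combines fetching and parsing; typical usage would be along these lines (URL and selector are placeholders):
// Sketch only: fetch a page with the helper from Example 20 and query it.
$dom = get_dom('http://example.com/');
foreach ($dom->find('h2 a') as $link) {
    echo $link->plaintext . ' -> ' . $link->href . PHP_EOL;
}
$dom->clear();   // release the parser's memory when done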
Note: The simple_html_dom examples in this article were collected from source code and documentation platforms such as GitHub and MSDocs, with snippets selected from open-source projects contributed by their respective developers. Copyright of the source code remains with the original authors; please consult each project's license before redistributing or reusing it.